diff --git a/.gitignore b/.gitignore
index df712fb0f..ef52805cf 100644
--- a/.gitignore
+++ b/.gitignore
@@ -4,6 +4,7 @@ animation.screenflow/
 README_files/
 README.html
 .DS_Store
+test-results/
 python-package/examples/titanic.db
 .quarto
 *.db
diff --git a/js/build.mjs b/js/build.mjs
index 6b95400d0..dda68cb85 100644
--- a/js/build.mjs
+++ b/js/build.mjs
@@ -24,6 +24,14 @@ const jsTargets = [
     source: "src/viz.ts",
     output: "../pkg-r/inst/htmldep/viz.js",
   },
+  {
+    source: "src/schema-display.js",
+    output: "../pkg-py/src/querychat/static/js/schema-display.js",
+  },
+  {
+    source: "src/schema-display.js",
+    output: "../pkg-r/inst/htmldep/schema-display.js",
+  },
 ];
 
 const cssTargets = [
diff --git a/js/src/schema-display.js b/js/src/schema-display.js
new file mode 100644
index 000000000..95966542e
--- /dev/null
+++ b/js/src/schema-display.js
@@ -0,0 +1,229 @@
+let lastDisplay = null; // the most recently created "Fetched schemas" <p>, reused for batching
+let lastDisplayTime = 0; // Date.now() timestamp of the last processed collector
+const BATCH_MS = 1000; // collectors processed within this many ms of the previous one share a <p>
+let activePanel = null; // { btn, panel } for the panel that is currently open, or null
+
+// -- Schema JSON parser --------------------------------------------------
+
+// Parse the JSON-encoded column list into the flat records renderTable() displays.
+// Absent or empty optional fields are normalised to null.
+function parseColumnsJson(json) {
+  const nonEmpty = (list) => Boolean(list) && list.length > 0;
+  const toRecord = (col) => ({
+    name: col.name,
+    type: col.sql_type,
+    units: col.units || null,
+    description: col.description || null,
+    constraints: nonEmpty(col.constraints) ? col.constraints.join(', ') : null,
+    range: col.min_val == null || col.max_val == null ? null : `${col.min_val} to ${col.max_val}`,
+    categories: nonEmpty(col.categories) ? col.categories.map((v) => `'${v}'`).join(', ') : null,
+  });
+  return JSON.parse(json).map((col) => toRecord(col));
+}
+
+// -- Table rendering -----------------------------------------------------
+
+// Escape a value for insertion into HTML text or a quoted attribute. Single quotes are
+// escaped too, so the result stays safe inside single-quoted attribute values.
+function esc(s) {
+  const entities = { '&': '&amp;', '<': '&lt;', '>': '&gt;', '"': '&quot;', "'": '&#39;' };
+  // Single pass: the '&' of an emitted entity is never escaped a second time.
+  return String(s).replace(/[&<>"']/g, (ch) => entities[ch]);
+}
+
+const TH = // header cells (<th>): sticky at top:0 of the scrolling panel
+  'padding:0.35em 0.75em;text-align:left;white-space:nowrap;font-weight:600;' +
+  'border-bottom:2px solid var(--bs-border-color,#dee2e6);' +
+  'background:var(--bs-tertiary-bg,#f8f9fa);' +
+  'position:sticky;top:0;z-index:1;';
+const TD_MONO = // monospace, no-wrap cells: used for the column name and type
+  'padding:0.3em 0.75em;white-space:nowrap;' +
+  'font-family:var(--bs-font-monospace,monospace);font-size:0.875em;' +
+  'border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));';
+const TD_WRAP = // wrapping cells capped at 22em: used for description and range/values
+  'padding:0.3em 0.75em;max-width:22em;overflow-wrap:break-word;' +
+  'border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));';
+const TD_NOWRAP = // no-wrap cells without the monospace font: used for constraints
+  'padding:0.3em 0.75em;white-space:nowrap;' +
+  'border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));';
+
+// Render parsed column records as the schema table's HTML; all values pass through esc().
+function renderTable(columns) {
+  const cell = (style, html) => `<td style="${style}">${html}</td>`;
+  const heading = (label) => `<th style="${TH}">${label}</th>`;
+
+  const rowFor = (col) => {
+    // Units, when present, follow the SQL type in muted brackets.
+    const unitsHtml = col.units
+      ? ` <span style="color:var(--bs-secondary-color,#6c757d)">[${esc(col.units)}]</span>`
+      : '';
+    const typeCell = esc(col.type) + unitsHtml;
+
+    // A numeric range takes precedence over a category list.
+    let details = '';
+    if (col.range) {
+      details = esc(col.range);
+    } else if (col.categories) {
+      details = esc(col.categories);
+    }
+
+    const cells = [
+      cell(TD_MONO, esc(col.name)),
+      cell(TD_MONO, typeCell),
+      cell(TD_WRAP, col.description ? esc(col.description) : ''),
+      cell(TD_NOWRAP, col.constraints ? esc(col.constraints) : ''),
+      cell(TD_WRAP, details),
+    ];
+    return `<tr>${cells.join('')}</tr>`;
+  };
+
+  const titles = ['Column', 'Type', 'Description', 'Constraints', 'Range / Values'];
+  return (
+    `<table style="border-collapse:collapse;min-width:100%;width:max-content;font-size:0.875em;">` +
+    `<thead><tr>${titles.map((t) => heading(t)).join('')}</tr></thead>` +
+    `<tbody>${columns.map((col) => rowFor(col)).join('')}</tbody>` +
+    `</table>`
+  );
+}
+
+// -- Panel positioning & lifecycle ---------------------------------------
+
+const PANEL_STYLE = // inline style of the floating schema panel; width/left/top are set by positionPanel()
+  'position:fixed;z-index:9999;' +
+  'background:var(--bs-body-bg,#fff);color:var(--bs-body-color,#212529);' +
+  'border:1px solid var(--bs-border-color,#dee2e6);' +
+  'border-radius:var(--bs-border-radius,0.375rem);' +
+  'box-shadow:0 4px 16px rgba(0,0,0,.15);' +
+  'overflow:auto;' +
+  'max-height:min(420px,60vh);';
+
+// Size the panel and place it beside `btn`, keeping 8px clear of the viewport edges.
+function positionPanel(btn, panel) {
+  const rect = btn.getBoundingClientRect();
+  const { innerWidth: vw, innerHeight: vh } = window;
+  const pw = Math.min(Math.max(360, vw * 0.55), vw - 16);
+  panel.style.width = `${pw}px`;
+  panel.style.left = `${Math.max(8, Math.min(rect.left, vw - pw - 8))}px`;
+  // Prefer below; go above only when below is tight (< 120px) and above has more room.
+  const spaceBelow = vh - rect.bottom - 8;
+  const spaceAbove = rect.top - 8;
+  const below = spaceBelow >= 120 || spaceBelow >= spaceAbove;
+  // A hidden panel has no layout height, so show it briefly to measure it. Assuming the
+  // 420px maximum instead left shorter panels floating far above the button.
+  const wasHidden = panel.hidden;
+  panel.hidden = false;
+  const panelH = Math.min(panel.offsetHeight, spaceAbove);
+  panel.hidden = wasHidden;
+  panel.style.top = `${below ? rect.bottom + 4 : Math.max(8, rect.top - panelH - 4)}px`;
+}
+
+// Hide whichever schema panel is currently open; a no-op when none is.
+function closePanel() {
+  if (!activePanel) return;
+  activePanel.panel.hidden = true;
+  activePanel.btn.setAttribute('aria-expanded', 'false');
+  activePanel = null;
+}
+
+document.addEventListener('click', closePanel); // clicks reaching the document (button and panel stop theirs) dismiss the panel
+document.addEventListener('keydown', (e) => {
+  if (e.key === 'Escape') closePanel();
+});
+window.addEventListener(
+  'scroll',
+  (e) => {
+    if (activePanel && !activePanel.panel.contains(/** @type {Node} */ (e.target))) {
+      closePanel(); // the scroll happened outside the open panel; scrolling inside it is ignored
+    }
+  },
+  true, // capture phase, so scrolling inside nested containers is seen here as well
+);
+window.addEventListener('resize', closePanel); // the panel was positioned for the previous viewport size
+
+// -- Button + panel construction -----------------------------------------
+
+// Build the inline button for one table plus its hidden schema panel (appended to <body>).
+function createBtn(tableName, columnsJson) {
+  const columns = parseColumnsJson(columnsJson);
+  const setAttrs = (el, attrs) =>
+    Object.entries(attrs).forEach(([key, value]) => el.setAttribute(key, value));
+  const btn = document.createElement('button');
+  btn.type = 'button';
+  btn.style.cssText =
+    'background:none;border:none;padding:0;color:inherit;' +
+    'text-decoration:underline dotted;cursor:pointer;font-size:inherit;border-radius:2px;';
+  btn.textContent = tableName;
+  setAttrs(btn, {
+    'aria-label': `Show schema for ${tableName}`,
+    'aria-expanded': 'false',
+    'aria-haspopup': 'dialog',
+  });
+
+  const panel = document.createElement('div');
+  setAttrs(panel, { role: 'dialog', 'aria-label': `${tableName} schema` });
+  panel.style.cssText = PANEL_STYLE;
+  panel.hidden = true;
+  panel.innerHTML = renderTable(columns);
+  document.body.appendChild(panel);
+
+  // Clicks on the button or panel must not reach the document-level close handler.
+  panel.addEventListener('click', (event) => event.stopPropagation());
+  btn.addEventListener('click', (event) => {
+    event.stopPropagation();
+    const wasOpen = Boolean(activePanel) && activePanel.panel === panel;
+    closePanel();
+    if (wasOpen) return; // a second click on the same button just closes its panel
+    positionPanel(btn, panel);
+    panel.hidden = false;
+    btn.setAttribute('aria-expanded', 'true');
+    activePanel = { btn, panel };
+  });
+  return btn;
+}
+
+// -- Focus ring for keyboard users (Bootstrap resets button outline) -----
+
+const style = document.createElement('style'); // created once, when this script is evaluated
+style.textContent =
+  '.qc-schema-display button:focus-visible{' +
+  'outline:2px solid currentColor;outline-offset:2px;border-radius:2px}';
+document.head.appendChild(style); // targets buttons inside the <p class="qc-schema-display"> built by processCollector
+
+// -- MutationObserver ---------------------------------------------------
+
+// Swap a sentinel for a schema button; sentinels arriving within BATCH_MS share one line.
+function processCollector(sentinel) {
+  const now = Date.now();
+  const btn = createBtn(sentinel.dataset.table, sentinel.dataset.schemaJson);
+  const canBatch =
+    lastDisplay && document.contains(lastDisplay) && now - lastDisplayTime < BATCH_MS;
+  if (!canBatch) {
+    const line = document.createElement('p');
+    line.className = 'qc-schema-display';
+    line.style.cssText = 'color:var(--bs-secondary-color,#6c757d);font-size:0.875em;margin:0.1rem 0;';
+    line.appendChild(document.createTextNode('🔍 Fetched schemas: '));
+    line.appendChild(btn);
+    sentinel.replaceWith(line);
+    lastDisplay = line;
+  } else {
+    lastDisplay.appendChild(document.createTextNode(', '));
+    lastDisplay.appendChild(btn);
+    sentinel.remove();
+  }
+  lastDisplayTime = now;
+}
+
+new MutationObserver((mutations) => {
+  for (const { addedNodes } of mutations) {
+    for (const node of addedNodes) {
+      if (node.nodeType !== 1) continue; // 1 is Node.ELEMENT_NODE; text and comment nodes are skipped
+      if (/** @type {Element} */ (node).classList.contains('qc-schema-collector')) {
+        processCollector(/** @type {HTMLElement} */ (node)); // the added node is itself a sentinel
+      } else {
+        /** @type {Element} */ (node) // otherwise search the added subtree for nested sentinels
+          .querySelectorAll('.qc-schema-collector')
+          .forEach((el) => processCollector(/** @type {HTMLElement} */ (el)));
+      }
+    }
+  }
+}).observe(document.body, { subtree: true, childList: true }); // watches node insertions anywhere under <body>
diff --git a/pkg-py/CHANGELOG.md b/pkg-py/CHANGELOG.md
index a00e8722e..384356136 100644
--- a/pkg-py/CHANGELOG.md
+++ b/pkg-py/CHANGELOG.md
@@ -9,13 +9,36 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ### New features
 
+* `QueryChat()` now supports **multiple related tables**. Register additional tables with `add_table()` and the LLM can reason across all of them — joins, cross-table filters, aggregations. Per-table reactive state (`df()`, `sql()`, `title()`) is accessible via `qc_vals.table("name")` on the value returned by `server()`. (#195)
+
+  ```python
+  qc = QueryChat(orders_df, "orders")
+  qc.add_table(customers_df, "customers")
+
+  qc_vals = qc.server()
+  qc_vals.table("orders").df()
+  qc_vals.table("customers").sql()
+  ```
+
+* A new **`DataDict`** type — integrating with the [data-dict](https://data-dict.tidyverse.org/) spec — lets you annotate tables and columns with plain-English descriptions loaded from a YAML file. This is the preferred way to provide additional context for the data, especially when multiple tables are relevant. The LLM receives these descriptions when it fetches the schema, helping it interpret ambiguous or domain-specific column names without any extra prompting. (#195)
+
+  ```python
+  QueryChat(data_dict="data_dict.yaml")
+  ```
+
 * Added `PinSource`, a data source for chatting with datasets pinned to a [pins](https://pins.rstudio.com/) board. Works with parquet, CSV, JSON, and Arrow pins, and uses the pin's title, description, and tags as the default data description. Install the optional dependency with `pip install querychat[pins]`. (#246)
 
 * File attachments are now enabled by default in the Shiny chat UI. Users can attach images, PDFs, and text files to their messages and the LLM will receive them. Disable with `allow_attachments=False` in `mod_ui()` or `QueryChat.ui()`. (#253)
 
+### Breaking Changes
+
+* The `data_source` property has been removed. Use `qc.table("name").data_source` to read a table's data source, and `qc.add_table(df, "name", replace=True)` to replace it. The `data_source` parameter to `server()` (Shiny) has also been removed; call `add_table()` before `server()` instead. (#195)
+
 ### Improvements
 
 * Chat greetings now use shinychat's greeting API (requires shinychat >= 0.4.0). A provided `greeting` renders instantly when the app loads, and when no `greeting` is given one is generated on demand without being added to the conversation history. Generated greetings are now preserved across bookmark/restore. (#249)
+
+* The system prompt is now lighter: full schema is no longer embedded upfront. Instead the LLM fetches per-table schema on demand via the new `querychat_get_schema` tool — and only when it needs to. When a `DataDict` is provided, the tool skips columns that already have descriptions, so the LLM only pays for what isn't already documented. (#195)
 * The query tool result card now starts collapsed by default. Users can still expand it to see the SQL query and results. Set `QUERYCHAT_TOOL_DETAILS=expanded` to restore the previous behavior. (#239)
 
 ## [0.6.1] - 2026-05-26
@@ -86,6 +109,8 @@ Each framework's `QueryChat` provides `.app()` for quick standalone apps and `.u
 
 ### New features
 
+* Added `PolarsLazySource` to support Polars LazyFrames as data sources. Data stays lazy until the render boundary, enabling efficient handling of large datasets. Pass a `polars.LazyFrame` directly to `QueryChat()` and queries will be executed lazily via Polars' SQLContext.
+
 * `QueryChat.console()` was added to launch interactive console-based chat sessions with your data source, with persistent conversation state across invocations. (#168)
 
 * `QueryChat.client()` can now create standalone querychat-enabled chat clients with configurable tools and callbacks, enabling use outside of Shiny applications. (#168)
diff --git a/pkg-py/docs/build-intro.qmd b/pkg-py/docs/build-intro.qmd
index ecac93711..ad2570559 100644
--- a/pkg-py/docs/build-intro.qmd
+++ b/pkg-py/docs/build-intro.qmd
@@ -4,21 +4,14 @@ title: Intro
 
 While the `.app()` method is a great [quick start](index.qmd#quick-start) for exploring data, building custom apps with querychat unlocks the full power of integrating natural language data exploration with custom visualizations, layouts, and interactivity.
 
-querychat is a particularly good fit for apps that have:
-
-1. **A single data source** (or a set of related tables that can be joined)
-2. **Multiple filters** that let users slice and explore the data in different ways
-3. **Several visualizations and outputs** that all depend on the same filtered data
-
-In these apps, querychat can replace or augment your filtering UI by allowing users to describe what they want to see in natural language. Instead of building complex filter controls, users can simply ask questions like "show me customers from California who spent over $1000 last quarter" and querychat will generate the appropriate SQL query.
+querychat lets users ask questions of their data in plain language — filtering, sorting, summarizing, joining across tables, and creating visualizations — all without needing to write SQL or navigate complex filter UIs. You can use it as the primary exploration interface in a standalone app, or embed it alongside curated views in an existing dashboard to let users go deeper than the views you designed.
 
 This is especially valuable when:
 
 - Your data has many columns and building a UI for all possible filters would be overwhelming
 - Users want to explore ad-hoc combinations of filters that you didn't anticipate
-- You want to make data exploration more accessible to users who aren't comfortable with traditional filtering UIs
-
-If you have an existing app with a data frame that flows through multiple outputs, querychat can be a natural addition to provide an alternative way to filter that data.
+- You have multiple related tables that users may want to query and join
+- You want to make data exploration more accessible to non-technical users
 
 ## General pattern
 
diff --git a/pkg-py/docs/build.qmd b/pkg-py/docs/build.qmd
index 460d36cc7..68ea3ceb1 100644
--- a/pkg-py/docs/build.qmd
+++ b/pkg-py/docs/build.qmd
@@ -303,22 +303,98 @@ def _():
 Users can also ask the LLM to "reset" or "show all data" to clear filters through the chat interface.
 :::
 
-### Advanced patterns
-
-#### Programmatic updates
+### Programmatic updates
 
 You can update the query state programmatically using `.sql()` and `.title()` as setters. This is useful for adding preset filter buttons or linking filters to other UI controls.
 
-#### Multiple datasets
+## Multiple tables
+
+querychat can work with multiple related tables in a single chat interface, letting users query across tables, join data, and filter any table independently. Register additional tables with `.add_table()` after creating the `QueryChat` instance, then access per-table state through the `.table()` method.
+
+### Registering tables
+
+Pass the first table when creating `QueryChat`, then call `.add_table()` for each additional table:
+
+```python
+from querychat import QueryChat
+
+qc = QueryChat(orders, "orders")
+qc.add_table(customers, "customers")
+qc.add_table(products, "products")
+```
+
+The LLM can query any registered table and write joins across them. You can inspect which tables are registered with `qc.table_names()`.
+
+### Per-table reactive access
+
+When working with multiple tables, access filtered data and SQL for each table individually using `.table()`:
+
+::: {.panel-tabset group="shiny-mode"}
+
+#### Express
+
+```python
+from shiny.express import render
+
+qc.sidebar()
+
+@render.data_frame
+def orders_table():
+    return qc.table("orders").df()
+
+@render.data_frame
+def customers_table():
+    return qc.table("customers").df()
+```
+
+#### Core
 
-To explore multiple datasets, use separate `QueryChat` instances (i.e., separate chat interfaces).
+```python
+def server(input, output, session):
+    qc_vals = qc.server()
 
-::: {.callout-note}
-### Multiple tables in one chat?
+    @render.data_frame
+    def orders_table():
+        return qc_vals.table("orders").df()
+
+    @render.data_frame
+    def customers_table():
+        return qc_vals.table("customers").df()
+```
 
-In some cases, you might be able to "pre-join" datasets into a single table and use one `QueryChat` instance to explore them together. In the future, we may support multiple filtered tables in one chat interface, but this is not currently available. Please upvote [the relevant issue](https://github.com/posit-dev/querychat/issues/6) if this is a feature you'd like to see!
 :::
 
+Each table has its own `.df()`, `.sql()`, and `.title()` reactives that update independently when the user filters that specific table.
+
+### Tracking the active table
+
+Use `.current_table()` to find out which table the LLM most recently queried. This is useful for auto-switching a tabbed UI to the relevant table:
+
+```python
+@reactive.effect
+def _():
+    name = qc_vals.current_table()
+    if name:
+        ui.update_navs("table_tabs", selected=name)
+```
+
+### Data dictionary
+
+When working with multiple related tables, providing a [data dictionary](context.qmd#data-dictionary) is strongly recommended. It tells the LLM how tables relate to each other, which columns are keys, and what domain terms mean — all of which help it write accurate joins and queries.
+
+```python
+from pathlib import Path
+
+qc = QueryChat(orders, "orders", data_dict=Path("data-dict.yaml"))
+qc.add_table(customers, "customers")
+```
+
+See [Provide context](context.qmd#data-dictionary) for the full data dictionary format.
+
+### Separate chat interfaces
+
+If your tables are truly independent (not related), you may prefer separate `QueryChat` instances, each with its own chat interface:
+
 ```{python}
 # | eval: false
 # | code-fold: true
@@ -328,10 +404,6 @@ In some cases, you might be able to "pre-join" datasets into a single table and
 
 ![](/images/multiple-datasets.png){fig-alt="Screenshot of a querychat app with two datasets: titanic and penguins." class="lightbox shadow rounded mb-3"}
 
-::: {.callout-note}
-Each dataset gets its own chat interface and maintains separate state.
-:::
-
 ## See also
 
 - [Greet users](greet.qmd) - Create welcoming onboarding experiences
diff --git a/pkg-py/docs/context.qmd b/pkg-py/docs/context.qmd
index df6cb25ae..123335dc0 100644
--- a/pkg-py/docs/context.qmd
+++ b/pkg-py/docs/context.qmd
@@ -2,73 +2,135 @@
 title: Provide context
 ---
 
-querychat automatically gathers information about your table to help the LLM write accurate SQL queries. This includes column names and types, numerical ranges, and categorical value examples.^[All of this information is provided to the LLM as part of the **system prompt** -- a string of text containing instructions and context for the LLM to consider when responding to user queries.]
+querychat automatically gathers schema information about your tables — column names, types, numerical ranges, and categorical values — and makes it available to the LLM on demand via the `querychat_get_schema` [tool](tools.qmd#schema-retrieval). The LLM calls this tool before writing SQL to understand the structure of the tables it's querying.
 
 Importantly, we are **not** sending your raw data to the LLM and asking it to do complicated math. The LLM only needs to understand the structure and schema of your data in order to write SQL queries.
 
-You can get even better results by customizing the system prompt in three ways:
+You can get even better results by providing additional context:
 
-1. Add a [data description](#data-description) to provide more context about what the data represents
-2. Add [custom instructions](#extra-instructions) to guide the LLM's behavior
-3. Use a fully [custom prompt template](#custom-template) if you want complete control (useful if you want to be certain the model cannot see any literal values from your data)
+1. Add a [data dictionary](#data-dictionary) to describe tables, columns, relationships, and domain terminology (recommended)
+2. Add a [data description](#data-description) for a simpler alternative when working with a single, straightforward table
+3. Add [custom instructions](#extra-instructions) to guide the LLM's behavior
+4. Use a fully [custom prompt template](#custom-template) if you want complete control
 
-## Default prompt
+## Data dictionary {#data-dictionary}
 
-For full visibility into the system prompt that querychat generates for the LLM, you can inspect the `system_prompt` property. This is useful for debugging and understanding exactly what context the LLM is using:
+A **data dictionary** is a YAML file that describes your tables, columns, relationships, and domain-specific terminology. It's the recommended way to provide context, especially when working with [multiple tables](build.qmd#multiple-tables) or when your data has domain-specific meaning that isn't obvious from column names alone.
 
-```python
+```{.python filename="app.py"}
+from pathlib import Path
 from querychat import QueryChat
-from querychat.data import titanic
 
-qc = QueryChat(titanic(), "titanic")
-print(qc.system_prompt)
+qc = QueryChat(
+    orders, "orders",
+    data_dict=Path("data-dict.yaml")
+)
+qc.add_table(customers, "customers")
 ```
 
-By default, the system prompt contains the following components:
+### Format
+
+Besides the `version` field, a data dictionary has three top-level sections: `tables`, `relationships`, and `glossary`.
+
+```{.yaml filename="data-dict.yaml"}
+version: "0.2.0"
+
+tables:
+  orders:
+    description: One row per customer order.
+    columns:
+      - name: order_id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique order identifier.
+      - name: customer_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: References customers.id.
+      - name: total
+        type: number(quantity)
+        description: Order total in USD.
+      - name: status
+        type: enum
+        values: [pending, shipped, delivered, cancelled]
+        description: Current order status.
+
+  customers:
+    description: One row per customer.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique customer identifier.
+      - name: name
+        type: string
+        description: Full name.
+      - name: region
+        type: string
+        description: Geographic sales region.
+
+relationships:
+  - description: Each order belongs to one customer.
+    cardinality: many-to-one
+    join: orders.customer_id = customers.id
+
+glossary:
+  AOV: Average order value — total revenue divided by number of orders.
+  churn: A customer who has not placed an order in the last 90 days.
+```
+
+#### Tables
+
+Each entry under `tables` describes one table. The key must match the table name you pass to `QueryChat` or `.add_table()`.
+
+- **`description`**: What this table represents (one sentence is usually enough).
+- **`columns`**: A list of column annotations. Each column can have:
+  - `name`: Column name (must match the actual column)
+  - `type`: Semantic type hint — `string`, `number`, `number(id)`, `number(quantity)`, `date`, `enum`
+  - `constraints`: Optional list — `primary_key`, `foreign_key`
+  - `description`: What this column means in plain English
+  - `values`: For `enum` columns, the list of possible values
+
+Columns listed in the data dictionary are excluded from the auto-generated schema (since your description supersedes the auto-detected metadata). Columns not listed are still auto-detected as usual.
+
+#### Relationships
+
+The `relationships` section tells the LLM how to join tables. Each entry has:
 
-1. The basic set of behaviors and guidelines the LLM must follow in order for querychat to work properly, including how to use [tools](tools.qmd) to execute queries and update the app.
-2. The SQL schema of the data frame you provided. This includes:
-    - Column names
-    - Data types (integer, float, boolean, datetime, text)
-    - For text columns with less than 10 unique values, we assume they are categorical variables and include the list of values
-    - For integer and float columns, we include the range
-3. A [data description](#data-description) (if provided via `data_description`)
-4. [Additional instructions](#additional-instructions) you want to use to guide querychat's behavior (if provided via `extra_instructions`).
+- `description`: A plain-English description of the relationship
+- `cardinality`: `one-to-one`, `one-to-many`, or `many-to-one`
+- `join`: The join condition (e.g., `orders.customer_id = customers.id`)
+
+#### Glossary
+
+The `glossary` section defines domain-specific terms that users might use in their questions. This helps the LLM translate business language into correct SQL.
 
 
 ## Data description {#data-description}
 
-If your column names are descriptive, querychat may already work well without additional context. However, if your columns are named `x`, `V1`, `value`, etc., you should provide a data description. Use the `data_description` parameter for this:
+For simple single-table use cases where a full data dictionary would be overkill, you can provide a **data description** — a free-form markdown file or string that describes what the data represents. Use the `data_description` parameter:
 
-```{.python filename="titanic-app.py"}
+```python
 from pathlib import Path
-from querychat import QueryChat
 
 qc = QueryChat(
     titanic,
     "titanic",
     data_description=Path("data_description.md")
 )
-app = qc.app()
 ```
 
-querychat doesn't need this information in any particular format -- just provide what a human would find helpful:
+querychat doesn't need this in any particular format — just provide what a human would find helpful:
 
 ```{.markdown filename="data_description.md"}
-This dataset contains information about Titanic passengers, collected for predicting survival.
+This dataset contains information about Titanic passengers.
 
 - survived: Survival (0 = No, 1 = Yes)
 - pclass: Ticket class (1 = 1st, 2 = 2nd, 3 = 3rd)
-- sex: Sex of passenger
-- age: Age in years
-- sibsp: Number of siblings/spouses aboard
-- parch: Number of parents/children aboard
-- fare: Passenger fare
 - embarked: Port of embarkation (C = Cherbourg, Q = Queenstown, S = Southampton)
 ```
 
 
-
 ## Additional instructions {#extra-instructions}
 
 You can add custom instructions to guide the LLM's behavior using the `extra_instructions` parameter:
@@ -86,7 +148,7 @@ Or as a string:
 ```python
 instructions = """
 - Use British spelling conventions
-- Stay on topic and only discuss the data dashboard
+- Stay on topic and only discuss the data
 - Refuse to answer unrelated questions
 """
 
@@ -98,6 +160,17 @@ qc = QueryChat(titanic, "titanic", extra_instructions=instructions)
 LLMs may not always follow your instructions perfectly. Test extensively when changing instructions or models.
 :::
 
+## Default prompt
+
+For full visibility into the system prompt that querychat generates for the LLM, you can inspect the `system_prompt` property. This is useful for debugging and understanding exactly what context the LLM is working with:
+
+```python
+from querychat import QueryChat
+from querychat.data import titanic
+
+qc = QueryChat(titanic(), "titanic")
+print(qc.system_prompt)
+```
 
 ## Custom template {#custom-template}
 
diff --git a/pkg-py/docs/index.qmd b/pkg-py/docs/index.qmd
index 8d119ae3b..d571e333b 100644
--- a/pkg-py/docs/index.qmd
+++ b/pkg-py/docs/index.qmd
@@ -126,8 +126,7 @@ pip install "querychat[streamlit]"  # or [gradio] or [dash]
 
 ## Build custom apps
 
-querychat is designed to be highly extensible -- it provides programmatic access to the chat interface, the filtered/sorted data frame, SQL queries, and more.
-This makes it easy to build custom web apps that leverage natural language interaction with your data.
+querychat is designed to be highly extensible — it provides programmatic access to the chat interface, the filtered/sorted data frame, SQL queries, and more. You can register [multiple related tables](build.qmd#multiple-tables) for cross-table queries and joins, and connect all of it to your own visualizations and layouts.
 For example, [here](https://github.com/posit-conf-2025/llm/blob/main/_solutions/25_querychat/25_querychat_02-end-app.R)'s a bespoke app for exploring Airbnb listings in Ashville, NC:
 
 ![](/images/airbnb.png){fig-alt="A custom app for exploring Airbnb listings, powered by querychat." class="lightbox shadow rounded mb-3"}
@@ -136,9 +135,9 @@ To learn more, see the build guides for your framework: [Shiny](build.qmd), [Str
 
 ## How it works
 
-querychat uses LLMs to translate natural language into SQL queries. Models of all sizes, from small ones you can run locally to large frontier models from major AI providers, are remarkably effective at this task. But even the best models need to understand your data's overall structure to perform well.
+querychat uses LLMs to translate natural language into SQL queries. Models of all sizes, from small ones you can run locally to large frontier models from major AI providers, are remarkably effective at this task. But even the best models need to understand your data's structure to perform well.
 
-To address this, querychat includes schema metadata -- column names, types, ranges, categorical values -- in the LLM's [system prompt](context.qmd). Importantly, querychat **does not** send raw data to the LLM; it shares only enough structural information for the model to generate accurate queries. When the LLM produces a query, querychat executes it in a SQL database (DuckDB[^duckdb], by default) to obtain precise results.
+To address this, querychat provides a schema retrieval [tool](tools.qmd#schema-retrieval) that the LLM calls on demand to learn about table structure — column names, types, ranges, and categorical values. You can further improve results by providing a [data dictionary](context.qmd#data-dictionary) with column descriptions, table relationships, and domain terminology. Importantly, querychat **does not** send raw data to the LLM; it shares only enough structural information for the model to generate accurate queries. When the LLM produces a query, querychat executes it in a SQL database (DuckDB[^duckdb], by default) to obtain precise results.
 
 This design makes querychat reliable, safe, and reproducible:
 
diff --git a/pkg-py/docs/tools.qmd b/pkg-py/docs/tools.qmd
index 44301f1d4..702bc865d 100644
--- a/pkg-py/docs/tools.qmd
+++ b/pkg-py/docs/tools.qmd
@@ -2,14 +2,24 @@
 title: Tools
 ---
 
-querychat combines [tool calling](https://posit-dev.github.io/chatlas/get-started/tools.html) with [reactivity](https://shiny.posit.co/py/docs/reactive-foundations.html) to not only execute SQL, but also reactively update dependent data views. Understanding how these tools work will help you better understand what querychat is capable of and how to customize/extend to its behavior. 
+querychat combines [tool calling](https://posit-dev.github.io/chatlas/get-started/tools.html) with [reactivity](https://shiny.posit.co/py/docs/reactive-foundations.html) to not only execute SQL, but also reactively update dependent data views. Understanding how these tools work will help you better understand what querychat is capable of and how to customize/extend its behavior.
 
 One important thing to understand generally about querychat's tools is they are Python functions, and that execution happens on _your machine_, not on the LLM provider's side. In other words, the SQL queries generated by the LLM are executed locally in the Python process running the app.
 
-querychat provides the LLM access to three tool groups:
+querychat provides the LLM access to four tool groups:
 
-1. **Data updating** - Filter and sort data (without sending results to the LLM).
-2. **Data analysis** - Calculate summaries and return results for interpretation by the LLM.
+1. **Schema retrieval** - Fetch table structure before writing SQL.
+2. **Data updating** - Filter and sort data (without sending results to the LLM).
+3. **Data analysis** - Calculate summaries and return results for interpretation by the LLM.
+4. **Data visualization** - Create charts inline in the chat.
+
+## Schema retrieval {#schema-retrieval}
+
+Before writing any SQL query, the LLM calls the `querychat_get_schema` tool to retrieve column names, types, value ranges, and descriptions for a specific table. This on-demand approach means the LLM only fetches schema for the tables it actually needs, keeping the system prompt lean and startup fast — especially when working with [multiple tables](build.qmd#multiple-tables) or large databases.
+
+If you've provided a [data dictionary](context.qmd#data-dictionary), the schema response includes your column descriptions and relationship information. Columns annotated in the data dictionary are excluded from the auto-generated schema metadata (since your description supersedes it).
+
+This tool is always registered and cannot be disabled.
 
 ## Data updating
 
@@ -61,7 +71,7 @@ This tool:
 2. Renders the `VISUALISE` clause as an Altair chart
 3. Displays the chart inline in the chat
 
-Unlike the data updating tools, visualization queries don't affect the dashboard filter.
+Unlike the data updating tools, visualization queries don't affect the active data filter.
 They query the full dataset independently, and each call produces a new inline chart message in the chat.
 
 The inline chart includes controls for fullscreen viewing, saving as PNG/SVG, and a "Show Query" toggle that reveals the underlying ggsql code.
@@ -96,6 +106,7 @@ If you'd like to better understand how the tools work and how the LLM is prompte
 
 **Prompts:**
 
+- [`prompts/tool-get-schema.md`](https://github.com/posit-dev/querychat/blob/main/pkg-py/src/querychat/prompts/tool-get-schema.md)
 - [`prompts/tool-update-dashboard.md`](https://github.com/posit-dev/querychat/blob/main/pkg-py/src/querychat/prompts/tool-update-dashboard.md)
 - [`prompts/tool-reset-dashboard.md`](https://github.com/posit-dev/querychat/blob/main/pkg-py/src/querychat/prompts/tool-reset-dashboard.md)
 - [`prompts/tool-query.md`](https://github.com/posit-dev/querychat/blob/main/pkg-py/src/querychat/prompts/tool-query.md)
diff --git a/pkg-py/examples/11-multi-table-nutrition/app.py b/pkg-py/examples/11-multi-table-nutrition/app.py
new file mode 100644
index 000000000..0a6e5ac88
--- /dev/null
+++ b/pkg-py/examples/11-multi-table-nutrition/app.py
@@ -0,0 +1,290 @@
+"""USDA Foundation Foods nutrition dashboard with querychat.
+
+Real nutrition data from the USDA Foundation Foods dataset (via the {foodbank}
+R package), organized across six tables:
+  foods, food_categories, nutrients, food_nutrients, food_portions, measure_units
+
+The main content area shows reactive value boxes and Plotly Express charts that
+update whenever querychat filters the data.
+
+Usage:
+    cd pkg-py
+    uv run shiny run examples/11-multi-table-nutrition/app.py
+"""
+from pathlib import Path
+
+import plotly.express as px
+import polars as pl
+import shinychat
+from shiny import App, reactive, render, ui
+from shinywidgets import output_widget, render_plotly
+
+from querychat import QueryChat
+
+# ── Data ─────────────────────────────────────────────────────────────────────
+
+_DATA_DIR = Path(__file__).parent / "data" / "foodbank"
+
+foods = pl.read_parquet(_DATA_DIR / "foods.parquet")
+food_categories = pl.read_parquet(_DATA_DIR / "food_categories.parquet")
+nutrients = pl.read_parquet(_DATA_DIR / "nutrients.parquet")
+food_nutrients = pl.read_parquet(_DATA_DIR / "food_nutrients.parquet")
+food_portions = pl.read_parquet(_DATA_DIR / "food_portions.parquet")
+measure_units = pl.read_parquet(_DATA_DIR / "measure_units.parquet")
+
+# Mapping from USDA nutrient ID to friendly column name
+_NUTRIENT_ID_TO_COL = {
+    1008: "energy_kcal",
+    1003: "protein_g",
+    1004: "fat_g",
+    1005: "carbs_g",
+    1079: "fiber_g",
+    1063: "sugars_g",
+    1258: "sat_fat_g",
+    1087: "calcium_mg",
+    1089: "iron_mg",
+    1093: "sodium_mg",
+    1162: "vitamin_c_mg",
+    1092: "potassium_mg",
+}
+
+_col_map = pl.DataFrame(
+    {
+        "nutrient_id": list(_NUTRIENT_ID_TO_COL.keys()),
+        "col": list(_NUTRIENT_ID_TO_COL.values()),
+    }
+).with_columns(pl.col("nutrient_id").cast(pl.Int32))
+
+_wide_nutrients = (
+    food_nutrients.join(_col_map, on="nutrient_id", how="left").pivot(
+        index="fdc_id", on="col", values="amount"
+    )
+)
+
+foods_wide = (
+    foods.join(
+        food_categories.select(["id", "description"]).rename(
+            {"description": "category"}
+        ),
+        left_on="food_category_id",
+        right_on="id",
+        how="left",
+    ).join(_wide_nutrients, on="fdc_id", how="left")
+)
+
+# ── QueryChat ─────────────────────────────────────────────────────────────────
+
+qc = QueryChat(
+    foods,
+    "foods",
+    data_dict=Path(__file__).parent / "nutrition-data-dict.yaml",
+    greeting="",
+)
+qc.add_table(food_categories, "food_categories")
+qc.add_table(nutrients, "nutrients")
+qc.add_table(food_nutrients, "food_nutrients")
+qc.add_table(food_portions, "food_portions")
+qc.add_table(measure_units, "measure_units")
+
+_GREETING = shinychat.chat_greeting(
+    "## USDA Foundation Foods Explorer\n\n"
+    "Real nutrition data for **436 foods** across 19 categories — "
+    "macronutrients, minerals, vitamins, and serving sizes.\n\n"
+    "**Filter this view**\n\n"
+    '<span class="suggestion">Show only foods where fiber exceeds sugar</span>\n\n'
+    '<span class="suggestion">High-protein, low-fat foods: protein > 20g and fat < 5g per 100g</span>\n\n'
+    '<span class="suggestion">Foods higher in potassium than sodium</span>\n\n'
+    "**Dig deeper**\n\n"
+    '<span class="suggestion">Which fruits or vegetables beat whole milk for calcium?</span>\n\n'
+    '<span class="suggestion">Rank all foods by protein per calorie</span>\n\n'
+    '<span class="suggestion">For 1 cup of oats, how much protein and fiber am I getting?</span>\n\n'
+)
+
+# ── App ───────────────────────────────────────────────────────────────────────
+
+
+def app_ui(request):
+    return ui.page_sidebar(
+        ui.sidebar(
+            qc.ui(greeting=_GREETING),
+            width=400,
+            height="100%",
+            fillable=True,
+            class_="querychat-sidebar",
+        ),
+        ui.layout_columns(
+            ui.value_box(
+                "Foods",
+                ui.output_text("n_foods"),
+                showcase=ui.tags.span("🍽️", style="font-size:2rem"),
+                theme="primary",
+            ),
+            ui.value_box(
+                "Avg Protein",
+                ui.output_text("avg_protein"),
+                showcase=ui.tags.span("🥩", style="font-size:2rem"),
+                theme="success",
+            ),
+            ui.value_box(
+                "Avg Fiber",
+                ui.output_text("avg_fiber"),
+                showcase=ui.tags.span("🥦", style="font-size:2rem"),
+                theme="info",
+            ),
+            ui.value_box(
+                "Avg Calories",
+                ui.output_text("avg_calories"),
+                showcase=ui.tags.span("🔥", style="font-size:2rem"),
+                theme="warning",
+            ),
+            col_widths=[3, 3, 3, 3],
+            gap="1rem",
+            fill=False,
+        ),
+        ui.layout_columns(
+            ui.card(
+                ui.card_header(ui.output_text("protein_chart_title")),
+                output_widget("protein_chart"),
+                full_screen=True,
+            ),
+            ui.card(
+                ui.card_header("Avg protein by category (top 10)"),
+                output_widget("macro_chart"),
+                full_screen=True,
+            ),
+        ),
+        ui.navset_card_underline(
+            *[
+                ui.nav_panel(name, ui.output_data_frame(f"dt_{name}"))
+                for name in qc.table_names()
+            ],
+            id="table_tabs",
+            full_screen=True,
+        ),
+        title="USDA Foundation Foods",
+        fillable=True,
+        class_="bslib-page-dashboard",
+    )
+
+
+def server(input, output, session):
+    qc_vals = qc.server()
+
+    @reactive.calc
+    def current_subset() -> pl.DataFrame:
+        queried = qc_vals.table("foods").df()
+        # queried may be polars or pandas depending on the data source
+        if hasattr(queried, "to_pandas"):  # polars DataFrame
+            ids = queried["fdc_id"].to_list()
+        else:  # pandas DataFrame
+            ids = queried["fdc_id"].tolist()
+        return foods_wide.filter(pl.col("fdc_id").is_in(ids))
+
+    @render.text
+    def n_foods():
+        return str(current_subset().height)
+
+    @render.text
+    def avg_protein():
+        v = current_subset()["protein_g"].drop_nulls().mean()
+        return f"{v:.1f} g" if v is not None else "—"
+
+    @render.text
+    def avg_fiber():
+        v = current_subset()["fiber_g"].drop_nulls().mean()
+        return f"{v:.1f} g" if v is not None else "—"
+
+    @render.text
+    def avg_calories():
+        v = current_subset()["energy_kcal"].drop_nulls().mean()
+        return f"{v:.0f} kcal" if v is not None else "—"
+
+    @render.text
+    def protein_chart_title():
+        n = current_subset().filter(pl.col("protein_g").is_not_null()).height
+        shown = min(n, 15)
+        return f"Top {shown} foods by protein (g/100g)"
+
+    @render_plotly
+    def protein_chart():
+        df = (
+            current_subset()
+            .filter(pl.col("protein_g").is_not_null())
+            .sort("protein_g", descending=True)
+            .head(15)
+            .with_columns(
+                pl.col("description")
+                .str.slice(0, 35)
+                .str.replace(r"(.{35}).+", "${1}…")
+                .alias("label")
+            )
+        )
+        fig = px.bar(
+            df,
+            x="protein_g",
+            y="label",
+            orientation="h",
+            hover_data={"category": True, "label": False, "description": True},
+            labels={"protein_g": "Protein (g/100g)", "label": ""},
+            color_discrete_sequence=["#2196F3"],
+        )
+        fig.update_layout(
+            showlegend=False,
+            yaxis={"categoryorder": "total ascending"},
+            margin={"l": 10, "r": 40, "t": 10, "b": 40},
+        )
+        return fig
+
+    @render_plotly
+    def macro_chart():
+        subset = current_subset()
+        # Limit to top 10 categories by food count to keep the chart readable
+        top_cats = (
+            subset.group_by("category")
+            .len()
+            .sort("len", descending=True)
+            .head(10)["category"]
+        )
+        agg = (
+            subset.filter(pl.col("category").is_in(top_cats))
+            .group_by("category")
+            .agg(pl.col("protein_g").mean().alias("avg_protein"))
+            .sort("avg_protein", descending=True)
+        )
+        fig = px.bar(
+            agg,
+            x="avg_protein",
+            y="category",
+            orientation="h",
+            labels={"avg_protein": "Avg protein (g/100g)", "category": ""},
+            color_discrete_sequence=["#4CAF50"],
+        )
+        fig.update_layout(
+            showlegend=False,
+            yaxis={"categoryorder": "total ascending"},
+            margin={"l": 10, "r": 10, "t": 10, "b": 10},
+        )
+        return fig
+
+    # Auto-switch tab when LLM queries a table
+    @reactive.effect
+    def _switch_tab():
+        name = qc_vals.current_table()
+        if name is not None:
+            ui.update_navs("table_tabs", selected=name)
+
+    # Register one data frame render per table.
+    # Value boxes and charts above remain tied to the `foods` table — they
+    # use foods-specific wide-format joins and are not generic per-table views.
+    def _make_dt_renderer(table_name: str):
+        @render.data_frame
+        def _renderer():
+            return qc_vals.table(table_name).df()
+
+        return _renderer
+
+    for _tname in qc.table_names():
+        output(id=f"dt_{_tname}")(_make_dt_renderer(_tname))
+
+
+app = App(app_ui, server)
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/extract_foodbank.R b/pkg-py/examples/11-multi-table-nutrition/data/extract_foodbank.R
new file mode 100644
index 000000000..f3b575db8
--- /dev/null
+++ b/pkg-py/examples/11-multi-table-nutrition/data/extract_foodbank.R
@@ -0,0 +1,59 @@
+#!/usr/bin/env Rscript
+# Extract USDA Foundation Foods data from the {foodbank} R package and write
+# as parquet files for use in the multi-table-nutrition Shiny for Python app.
+#
+# Run from the pkg-py/examples/11-multi-table-nutrition/data directory:
+#   Rscript extract_foodbank.R
+#
+# Requires: foodbank (github::hadley/foodbank), nanoparquet
+#   pak::pkg_install(c("hadley/foodbank", "nanoparquet"))
+
+library(foodbank)
+library(nanoparquet)
+
+script_dir <- tryCatch(
+  dirname(normalizePath(sys.frame(1)$ofile)),
+  error = function(e) getwd()
+)
+out_dir <- file.path(script_dir, "foodbank")
+dir.create(out_dir, showWarnings = FALSE, recursive = TRUE)
+
+# Key nutrient IDs to include (a curated subset of the 477 available)
+key_ids <- c(
+  1008L,  # Energy (kcal)
+  1003L,  # Protein (g)
+  1004L,  # Total lipid / fat (g)
+  1005L,  # Carbohydrate, by difference (g)
+  1079L,  # Fiber, total dietary (g)
+  1063L,  # Sugars, Total (g)
+  1258L,  # Fatty acids, total saturated (g)
+  1087L,  # Calcium, Ca (mg)
+  1089L,  # Iron, Fe (mg)
+  1093L,  # Sodium, Na (mg)
+  1162L,  # Vitamin C, total ascorbic acid (mg)
+  1092L   # Potassium, K (mg)
+)
+
+write_parquet(food,          file.path(out_dir, "foods.parquet"))
+write_parquet(food_category, file.path(out_dir, "food_categories.parquet"))
+write_parquet(
+  nutrient[nutrient$id %in% key_ids, c("id", "name", "unit_name")],
+  file.path(out_dir, "nutrients.parquet")
+)
+write_parquet(
+  food_nutrient[food_nutrient$nutrient_id %in% key_ids,
+                c("fdc_id", "nutrient_id", "amount")],
+  file.path(out_dir, "food_nutrients.parquet")
+)
+write_parquet(
+  food_portion[, c("fdc_id", "seq_num", "amount", "measure_unit_id",
+                   "gram_weight", "modifier")],
+  file.path(out_dir, "food_portions.parquet")
+)
+used_unit_ids <- unique(food_portion$measure_unit_id)
+write_parquet(
+  measure_unit[measure_unit$id %in% used_unit_ids, ],
+  file.path(out_dir, "measure_units.parquet")
+)
+
+cat("Wrote parquet files to", out_dir, "\n")
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_categories.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_categories.parquet
new file mode 100644
index 000000000..10f6d585a
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_categories.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet
new file mode 100644
index 000000000..87edd01ac
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_portions.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_portions.parquet
new file mode 100644
index 000000000..b9fc1b411
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/food_portions.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/foods.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/foods.parquet
new file mode 100644
index 000000000..c52fd37fe
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/foods.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/measure_units.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/measure_units.parquet
new file mode 100644
index 000000000..7a4019495
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/measure_units.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/data/foodbank/nutrients.parquet b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/nutrients.parquet
new file mode 100644
index 000000000..23c533adb
Binary files /dev/null and b/pkg-py/examples/11-multi-table-nutrition/data/foodbank/nutrients.parquet differ
diff --git a/pkg-py/examples/11-multi-table-nutrition/nutrition-data-dict.yaml b/pkg-py/examples/11-multi-table-nutrition/nutrition-data-dict.yaml
new file mode 100644
index 000000000..a8455e6fc
--- /dev/null
+++ b/pkg-py/examples/11-multi-table-nutrition/nutrition-data-dict.yaml
@@ -0,0 +1,161 @@
+version: "0.2.0"
+
+tables:
+  foods:
+    description: >
+      One row per USDA Foundation Food item. Nutrient values are not stored here —
+      see food_nutrients. All nutrient amounts in food_nutrients are per 100g of the food.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique food identifier from USDA FoodData Central.
+      - name: description
+        type: string
+        description: Full name of the food item (e.g., "Broccoli, raw").
+      - name: food_category_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Category of the food. Joins to food_categories.id.
+      - name: publication_date
+        type: date
+        description: Date the food record was published by USDA.
+
+  food_categories:
+    description: Lookup table of USDA food categories. One row per category.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique category identifier.
+      - name: code
+        type: number
+        description: USDA numeric category code (e.g., 1100 for Vegetables).
+      - name: description
+        type: string
+        description: Human-readable category name (e.g., "Vegetables and Vegetable Products").
+
+  nutrients:
+    description: >
+      Registry of the 12 key nutritional compounds tracked in this dataset.
+      One row per nutrient type. See the glossary for the full list of nutrient IDs.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: USDA nutrient identifier (e.g., 1003 for Protein).
+      - name: name
+        type: string
+        description: >
+          Official USDA nutrient name (e.g., "Protein", "Total lipid (fat)",
+          "Carbohydrate, by difference").
+      - name: unit_name
+        type: enum
+        values: [G, KCAL, MG]
+        description: Unit of measurement. G = grams, KCAL = kilocalories, MG = milligrams.
+
+  food_nutrients:
+    description: >
+      Nutrient content per 100g of food. One row per food–nutrient combination.
+      Only the 12 key nutrients are included (see nutrients table and glossary).
+      To get nutrient values for a food, join on fdc_id.
+      To get nutrient names and units, join nutrients on nutrient_id.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the food. Joins to foods.fdc_id.
+      - name: nutrient_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the nutrient. Joins to nutrients.id.
+      - name: amount
+        type: number(quantity)
+        description: >
+          Amount of the nutrient per 100g of food, in the unit given by
+          nutrients.unit_name. May be null if the nutrient was not measured
+          for this food.
+
+  food_portions:
+    description: >
+      Common serving sizes for foods. One row per portion definition.
+      A single food may have multiple portions (e.g., "1 cup" and "1 oz").
+      Not all foods have portion data — only 116 of the 436 foods are covered.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the food. Joins to foods.fdc_id.
+      - name: seq_num
+        type: number
+        description: Sequence number ordering multiple portions for the same food.
+      - name: amount
+        type: number(quantity)
+        description: >
+          The number of measure units in this portion (e.g., 1.0 for "1 cup",
+          2.0 for "2 tablespoons").
+      - name: measure_unit_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Unit of the portion. Joins to measure_units.id.
+      - name: gram_weight
+        type: number(quantity)
+        description: Weight in grams of this portion (e.g., 240 for 1 cup of milk).
+      - name: modifier
+        type: string
+        description: >
+          Optional preparation note for the portion (e.g., "chopped", "drained",
+          "cooked"). Null when no modifier applies.
+
+  measure_units:
+    description: >
+      Lookup table of measurement unit names used in food_portions.
+      Only units that appear in food_portions are included (~32 of the 123 total).
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique unit identifier.
+      - name: name
+        type: string
+        description: >
+          Human-readable unit name (e.g., "cup", "tablespoon", "oz", "slice",
+          "piece", "package").
+
+relationships:
+  - description: Each food belongs to one category.
+    cardinality: many-to-one
+    join: foods.food_category_id = food_categories.id
+  - description: Each food has one row per tracked nutrient.
+    cardinality: one-to-many
+    join: foods.fdc_id = food_nutrients.fdc_id
+  - description: Each nutrient type appears in many food measurements.
+    cardinality: one-to-many
+    join: nutrients.id = food_nutrients.nutrient_id
+  - description: Each food may have one or more common portion sizes.
+    cardinality: one-to-many
+    join: foods.fdc_id = food_portions.fdc_id
+  - description: Each portion references a measurement unit.
+    cardinality: many-to-one
+    join: food_portions.measure_unit_id = measure_units.id
+
+glossary:
+  per 100g: All nutrient amounts in food_nutrients are normalized to a 100-gram serving for fair comparison across foods.
+  fdc_id: USDA FoodData Central identifier — the primary key for food items in this dataset.
+  energy: Total caloric value, measured in kilocalories (kcal). Nutrient ID 1008.
+  macronutrient: One of the three main energy-providing nutrients — protein (ID 1003), fat (ID 1004), or carbohydrates (ID 1005).
+  nutrient IDs: >
+    Key nutrient IDs in this dataset:
+    1003 = Protein (G),
+    1004 = Total lipid / fat (G),
+    1005 = Carbohydrate by difference (G),
+    1008 = Energy (KCAL),
+    1063 = Sugars Total (G),
+    1079 = Fiber total dietary (G),
+    1258 = Fatty acids total saturated (G),
+    1087 = Calcium Ca (MG),
+    1089 = Iron Fe (MG),
+    1093 = Sodium Na (MG),
+    1162 = Vitamin C total ascorbic acid (MG),
+    1092 = Potassium K (MG).
+  gram_weight: The actual weight in grams of a described portion. Use this to convert per-100g nutrient values to per-serving values by multiplying by (gram_weight / 100).
diff --git a/pkg-py/examples/12-multi-table-express.py b/pkg-py/examples/12-multi-table-express.py
new file mode 100644
index 000000000..1f87e0828
--- /dev/null
+++ b/pkg-py/examples/12-multi-table-express.py
@@ -0,0 +1,54 @@
+"""Minimal multi-table querychat example using Shiny Express.
+
+Two related tables (orders + customers) are registered with a single QueryChat
+instance. The LLM can query either table or write joins across them.
+Per-table filtered data is accessed with `qc.table("name").df()`.
+
+Usage:
+    cd pkg-py
+    uv run shiny run examples/12-multi-table-express.py
+"""
+
+import pandas as pd
+from shiny.express import render, ui
+
+from querychat.express import QueryChat
+
+orders = pd.DataFrame(
+    {
+        "order_id": [1, 2, 3, 4, 5],
+        "customer_id": [101, 102, 101, 103, 102],
+        "amount": [250.0, 180.0, 320.0, 90.0, 450.0],
+        "status": ["shipped", "pending", "shipped", "delivered", "pending"],
+    }
+)
+
+customers = pd.DataFrame(
+    {
+        "customer_id": [101, 102, 103],
+        "name": ["Alice", "Bob", "Carol"],
+        "city": ["Boston", "Chicago", "Denver"],
+    }
+)
+
+qc = QueryChat(orders, "orders")
+qc.add_table(customers, "customers")
+qc.sidebar()
+
+with ui.navset_card_underline():
+    with ui.nav_panel("Orders"):
+
+        @render.data_frame
+        def orders_table():
+            return qc.table("orders").df()
+
+    with ui.nav_panel("Customers"):
+
+        @render.data_frame
+        def customers_table():
+            return qc.table("customers").df()
+
+ui.page_opts(
+    title="Orders & Customers",
+    fillable=True,
+)
diff --git a/pkg-py/src/querychat/__init__.py b/pkg-py/src/querychat/__init__.py
index 0e3eaa5f5..953f73840 100644
--- a/pkg-py/src/querychat/__init__.py
+++ b/pkg-py/src/querychat/__init__.py
@@ -1,9 +1,11 @@
+from ._data_dict import DataDict
 from ._deprecated import greeting, init, sidebar, system_prompt
 from ._deprecated import mod_server as server
 from ._deprecated import mod_ui as ui
 from ._shiny import QueryChat
 
 __all__ = (
+    "DataDict",
     "QueryChat",
     # TODO(lifecycle): Remove these deprecated functions when we reach v1.0
     "greeting",
diff --git a/pkg-py/src/querychat/_dash.py b/pkg-py/src/querychat/_dash.py
index da9b57da9..5d4c4df10 100644
--- a/pkg-py/src/querychat/_dash.py
+++ b/pkg-py/src/querychat/_dash.py
@@ -8,12 +8,11 @@
 from narwhals.stable.v1.typing import IntoDataFrameT, IntoFrameT, IntoLazyFrameT
 
 from ._dash_ui import IDs, card_ui, chat_container_ui, chat_messages_ui
-from ._querychat_base import TOOL_GROUPS, QueryChatBase
+from ._querychat_base import TOOL_GROUPS, StateDictQueryChat
 from ._querychat_core import (
     GREETING_PROMPT,
     AppState,
     AppStateDict,
-    StateDictAccessorMixin,
     create_app_state,
     stream_response_async,
 )
@@ -33,8 +32,10 @@
     import dash
     from dash import html
 
+    from ._data_dict import DataDict
 
-class QueryChat(QueryChatBase[IntoFrameT], StateDictAccessorMixin[IntoFrameT]):
+
+class QueryChat(StateDictQueryChat[IntoFrameT]):
     """
     QueryChat for Dash applications.
 
@@ -92,16 +93,17 @@ def update_sql(state):
     @overload
     def __init__(
         self: QueryChat[Any],
-        data_source: None,
-        table_name: str,
+        data_source: None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ) -> None: ...
 
@@ -114,10 +116,11 @@ def __init__(
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ) -> None: ...
 
@@ -130,10 +133,11 @@ def __init__(
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ) -> None: ...
 
@@ -146,10 +150,11 @@ def __init__(
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ) -> None: ...
 
@@ -162,25 +167,27 @@ def __init__(
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ) -> None: ...
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None,
-        table_name: str,
+        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | PathType] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | PathType] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | PathType | None = None,
         extra_instructions: Optional[str | PathType] = None,
         prompt_template: Optional[str | PathType] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | PathType] = None,
         storage_type: Literal["memory", "session", "local"] = "memory",
     ):
         super().__init__(
@@ -190,12 +197,13 @@ def __init__(
             client=client,
             tools=tools,
             data_description=data_description,
+            data_dict=data_dict,
             categorical_threshold=categorical_threshold,
             extra_instructions=extra_instructions,
             prompt_template=prompt_template,
         )
         self._storage_type: Literal["memory", "session", "local"] = storage_type
-        self._ids = IDs.from_table_name(table_name)
+        self._ids = IDs.from_table_name(table_name or "querychat")
         self._initialized_apps: set[int] = set()
 
     @property
@@ -217,12 +225,18 @@ def app(self) -> dash.Dash:
             A Dash app ready to run.
 
         """
-        data_source = self._require_data_source("app")
+        self._require_initialized("app")
+        if len(self._data_sources) > 1:
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            raise RuntimeError(
+                f"app() does not support multiple tables ({table_list}). "
+                "Build a custom layout using ui() and table('name') instead."
+            )
         import dash_bootstrap_components as dbc
 
         import dash
 
-        table_name = data_source.table_name
+        table_name = next(iter(self._data_sources))
 
         app = dash.Dash(
             __name__,
@@ -235,7 +249,7 @@ def app(self) -> dash.Dash:
         register_app_callbacks(
             app,
             self._ids,
-            data_source.table_name,
+            table_name,
             self._deserialize_state,
         )
 
@@ -276,13 +290,14 @@ def ui(
         ...     return f"Current SQL: {sql}"
 
         """
-        data_source = self._require_data_source("ui")
+        self._require_initialized("ui")
         from dash import dcc, html
 
         initial_state = create_app_state(
-            data_source,
-            self._client_factory,
-            self.greeting,
+            data_sources=dict(self._data_sources),
+            client_factory=self._client_factory,
+            greeting=self.greeting,
+            query_executor=self._require_query_executor("ui"),
         )
 
         return html.Div(
diff --git a/pkg-py/src/querychat/_data_dict.py b/pkg-py/src/querychat/_data_dict.py
new file mode 100644
index 000000000..6fa909c8c
--- /dev/null
+++ b/pkg-py/src/querychat/_data_dict.py
@@ -0,0 +1,249 @@
+from __future__ import annotations
+
+from pathlib import Path
+from typing import TYPE_CHECKING, Any
+
+from pydantic import BaseModel
+
+if TYPE_CHECKING:
+    from ._datasource import ColumnMeta
+    from ._query_executor import QueryExecutor
+
+
+class ColumnRange(BaseModel):
+    """Inclusive min/max bounds for a column, used instead of live min/max queries."""
+
+    min: Any = None
+    max: Any = None
+
+
+class ColumnSpec(BaseModel):
+    """
+    Per-column metadata entry in a :class:`DataDict`.
+
+    Every field except ``name`` is optional. ``name`` is required and is used
+    to match this spec against columns returned by the data source.
+
+    Parameters
+    ----------
+    name
+        Column name as it appears in the data source.
+    type
+        Human-readable type override (e.g. ``"date"``, ``"currency"``). When
+        supplied, this replaces the inferred SQL type in the LLM schema view.
+    constraints
+        Free-text constraints conveyed to the LLM (e.g. ``"non-negative"``).
+    description
+        Short description forwarded verbatim to the LLM's schema view.
+    details
+        Longer narrative about the column, used only in the on-demand
+        ``get_schema`` tool response.
+    units
+        Unit label (e.g. ``"kg"``, ``"USD"``), included in the schema view.
+    values
+        Exhaustive list of valid values. Replaces categorical inference for
+        this column — querychat will not query the data source for distinct
+        values when this is set.
+    range
+        Inclusive min/max bounds. Replaces live min/max statistics queries
+        when set.
+    examples
+        Representative sample values shown to the LLM as context.
+
+    """
+
+    name: str
+    type: str | None = None
+    constraints: list[str] = []
+    description: str | None = None
+    details: str | None = None
+    units: str | None = None
+    values: list[Any] | None = None
+    range: ColumnRange | None = None
+    examples: list[Any] | None = None
+
+
+class TableSpec(BaseModel):
+    """
+    Metadata for a single table in a :class:`DataDict`.
+
+    Parameters
+    ----------
+    description
+        Short description of the table, forwarded to the LLM's schema view.
+    details
+        Longer narrative shown only in the on-demand ``get_schema`` tool
+        response.
+    columns
+        Per-column specifications, matched by ``name``. Columns not listed
+        here are documented using live statistics inferred from the data.
+
+    """
+
+    description: str | None = None
+    details: str | None = None
+    columns: list[ColumnSpec] = []
+
+
+class RelationshipSpec(BaseModel):
+    """
+    A declared relationship between two tables.
+
+    Parameters
+    ----------
+    description
+        Human-readable description of the relationship.
+    cardinality
+        Cardinality string (e.g. ``"one-to-many"``).
+    join
+        SQL JOIN clause or expression that links the tables. Required.
+
+    """
+
+    description: str | None = None
+    cardinality: str | None = None
+    join: str
+
+
+class DataDict(BaseModel):
+    """
+    A data dictionary providing rich per-table and per-column metadata.
+
+    Pass a ``DataDict`` to ``QueryChat`` (or load one from YAML via
+    :meth:`from_yaml`) to give the LLM better context about your data without
+    querying the data source for statistics at startup.
+
+    For columns listed in a ``DataDict``:
+
+    * ``values`` replaces categorical inference (no ``SELECT DISTINCT`` query).
+    * ``range`` replaces live min/max statistics queries.
+    * ``description`` is forwarded verbatim to the LLM's schema view.
+
+    Columns not listed fall back to the normal live-statistics path.
+
+    Parameters
+    ----------
+    name
+        Short identifier for this dictionary's domain (e.g. ``"sales"``).
+        Used as the ``name`` attribute on the ``<data-dict>`` tag in the system
+        prompt. When loading from YAML via :meth:`from_yaml`, defaults to the
+        file stem if not set explicitly.
+    description
+        One-line summary of the domain, shown alongside ``name`` in the
+        system prompt.
+    tables
+        Per-table metadata, keyed by table name. Each value is a
+        :class:`TableSpec` with optional description and column specs.
+        Table names must match those registered with ``QueryChat``.
+    relationships
+        Cross-table relationship declarations. Useful context for multi-table
+        apps where the LLM needs to know how tables join.
+    glossary
+        Domain-specific term definitions passed to the LLM as context
+        (e.g. ``{"ARR": "Annual Recurring Revenue"}``).
+
+    Examples
+    --------
+    Load from a YAML file:
+
+    ```python
+    from querychat import QueryChat, DataDict
+
+    qc = QueryChat(df, "sales", data_dict=DataDict.from_yaml("data_dict.yaml"))
+    ```
+
+    Or pass a path directly and let QueryChat load it:
+
+    ```python
+    qc = QueryChat(df, "sales", data_dict="data_dict.yaml")
+    ```
+
+    """
+
+    name: str | None = None
+    description: str | None = None
+    tables: dict[str, TableSpec] = {}
+    relationships: list[RelationshipSpec] = []
+    glossary: dict[str, str] = {}
+
+    def to_prompt_dict(self) -> dict[str, Any]:
+        """Return the system-prompt view: no column specs or ``details`` text."""
+        result: dict[str, Any] = {}
+        if self.name is not None:
+            result["name"] = self.name
+        if self.description is not None:
+            result["description"] = self.description
+        if self.tables:
+            result["tables"] = {
+                name: ({"description": spec.description} if spec.description else None)
+                for name, spec in self.tables.items()
+            }
+        if self.relationships:
+            result["relationships"] = [
+                {k: v for k, v in rel.model_dump().items() if v is not None}
+                for rel in self.relationships
+            ]
+        if self.glossary:
+            result["glossary"] = self.glossary
+        return result
+
+    def get_table_schema(
+        self,
+        table_name: str,
+        executor: QueryExecutor,
+        categorical_threshold: int,
+    ) -> list[ColumnMeta]:
+        # Authoritative column names and types, as reported by the executor
+        metas: list[ColumnMeta] = executor.get_column_metas(table_name)
+
+        # Index this table's specs by column name; columns with a spec skip live stats
+        table_spec = self.tables.get(table_name)
+        documented: dict[str, ColumnSpec] = (
+            {col.name: col for col in table_spec.columns} if table_spec else {}
+        )
+
+        undocumented: list[ColumnMeta] = []
+        for meta in metas:
+            spec = documented.get(meta.name)
+            if spec is not None:
+                if spec.type is not None:
+                    meta.sql_type = spec.type
+                if spec.range is not None:
+                    meta.min_val = spec.range.min
+                    meta.max_val = spec.range.max
+                if spec.values is not None:
+                    meta.categories = [str(v) for v in spec.values]
+                if spec.description is not None:
+                    meta.description = spec.description
+                if spec.units is not None:
+                    meta.units = spec.units
+                if spec.constraints:
+                    meta.constraints = list(spec.constraints)
+            else:
+                undocumented.append(meta)
+
+        if undocumented:
+            executor.populate_column_stats(table_name, undocumented, categorical_threshold)
+
+        return metas
+
+    @classmethod
+    def from_yaml(cls, path: Path | str) -> DataDict:
+        """
+        Load a :class:`DataDict` from a UTF-8 encoded YAML file.
+
+        Parameters
+        ----------
+        path
+            Path to the YAML file. Its stem becomes ``name`` when unset.
+
+        """
+        import yaml
+
+        path = Path(path)
+        with path.open(encoding="utf-8") as f:
+            data = yaml.safe_load(f) or {}
+        dd = cls.model_validate(data)
+        if dd.name is None:
+            dd = dd.model_copy(update={"name": path.stem})
+        return dd
diff --git a/pkg-py/src/querychat/_datasource.py b/pkg-py/src/querychat/_datasource.py
index ed2c8ecd4..55af587db 100644
--- a/pkg-py/src/querychat/_datasource.py
+++ b/pkg-py/src/querychat/_datasource.py
@@ -51,14 +51,30 @@ class ColumnMeta:
     categories: list[str] = field(default_factory=list)
     """Unique values for text columns below the categorical threshold."""
 
+    description: str | None = None
+    """Optional human-readable description of the column."""
+
+    units: str | None = None
+    """Unit label (e.g. 'kg', 'USD')."""
+
+    constraints: list[str] = field(default_factory=list)
+    """Free-text constraints (e.g. 'non-negative')."""
+
 
 def format_schema(table_name: str, columns: list[ColumnMeta]) -> str:
     """Format column metadata into schema string."""
     lines = [f"Table: {table_name}", "Columns:"]
 
     for col in columns:
-        lines.append(f"- {col.name} ({col.sql_type})")
-
+        header = f"- {col.name} ({col.sql_type})"
+        if col.units:
+            header += f" [{col.units}]"
+        lines.append(header)
+
+        if col.description:
+            lines.append(f"  Description: {col.description}")
+        if col.constraints:
+            lines.append(f"  Constraints: {', '.join(col.constraints)}")
         if col.kind in ("numeric", "date") and col.min_val is not None and col.max_val is not None:
             lines.append(f"  Range: {col.min_val} to {col.max_val}")
         elif col.categories:
@@ -152,19 +168,6 @@ def duckdb_column_stats(
         pass
 
 
-def duckdb_get_schema(
-    conn: duckdb.DuckDBPyConnection,
-    table_name: str,
-    categorical_threshold: int,
-) -> str:
-    """Generate schema string from a DuckDB connection and table name."""
-    result = conn.execute(f'SELECT * FROM "{table_name}" LIMIT 0')
-    columns = [
-        duckdb_column_meta(desc[0], desc[1]) for desc in result.description
-    ]
-    duckdb_column_stats(conn, table_name, columns, categorical_threshold)
-    return format_schema(table_name, columns)
-
 
 def duckdb_lock_down(conn: duckdb.DuckDBPyConnection) -> None:
     """Lock down a DuckDB connection to prevent LLM-generated SQL from accessing external resources."""
@@ -220,6 +223,18 @@ def get_schema(self, *, categorical_threshold: int) -> str:
         """
         ...
 
+    @abstractmethod
+    def get_column_metas(self) -> list[ColumnMeta]:
+        """Return column names and types without running stats queries."""
+        ...
+
+    @abstractmethod
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        """Populate min/max/categories on the given ColumnMeta list in place."""
+        ...
+
     @abstractmethod
     def execute_query(self, query: str) -> IntoFrameT:
         """
@@ -368,7 +383,18 @@ def get_schema(self, *, categorical_threshold: int) -> str:
             String describing the schema
 
         """
-        return duckdb_get_schema(self._conn, self.table_name, categorical_threshold)
+        metas = self.get_column_metas()
+        self.populate_column_stats(metas, categorical_threshold)
+        return format_schema(self.table_name, metas)
+
+    def get_column_metas(self) -> list[ColumnMeta]:
+        result = self._conn.execute(f'SELECT * FROM "{self.table_name}" LIMIT 0')
+        return [duckdb_column_meta(desc[0], desc[1]) for desc in result.description]
+
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        duckdb_column_stats(self._conn, self.table_name, columns, categorical_threshold)
 
     def execute_query(self, query: str) -> IntoDataFrameT:
         """
@@ -536,6 +562,11 @@ def get_db_type(self) -> str:
         """
         return self._engine.dialect.name.upper().replace(" SQL", "")
 
+    @property
+    def engine(self) -> Engine:
+        """The SQLAlchemy engine for this data source."""
+        return self._engine
+
     def get_schema(self, *, categorical_threshold: int) -> str:
         """
         Generate schema information from database table.
@@ -552,12 +583,20 @@ def get_schema(self, *, categorical_threshold: int) -> str:
             String describing the schema
 
         """
-        columns = [
+        metas = self.get_column_metas()
+        self.populate_column_stats(metas, categorical_threshold)
+        return format_schema(self.table_name, metas)
+
+    def get_column_metas(self) -> list[ColumnMeta]:
+        return [
             self._make_column_meta(col["name"], col["type"])
             for col in self._columns_info
         ]
+
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
         self._add_column_stats(columns, categorical_threshold)
-        return format_schema(self.table_name, columns)
 
     def get_semantic_views_description(self) -> str:
         """Get information about semantic views (if any) for the system prompt."""
@@ -827,14 +866,17 @@ def get_db_type(self) -> str:
 
     def get_schema(self, *, categorical_threshold: int) -> str:
         """Generate schema information from LazyFrame using lazy aggregates."""
-        # Build column metadata (classification happens here)
-        columns = [
-            self._make_column_meta(name, dtype) for name, dtype in self._schema.items()
-        ]
+        metas = self.get_column_metas()
+        self.populate_column_stats(metas, categorical_threshold)
+        return format_schema(self.table_name, metas)
+
+    def get_column_metas(self) -> list[ColumnMeta]:
+        return [self._make_column_meta(name, dtype) for name, dtype in self._schema.items()]
 
-        # Add stats to the metadata and format schema string
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
         self._add_column_stats(columns, self._lf, categorical_threshold)
-        return format_schema(self.table_name, columns)
 
     def execute_query(self, query: str) -> pl.LazyFrame:
         """
@@ -1029,12 +1071,25 @@ def __init__(self, table: ibis.Table, table_name: str):
     def get_db_type(self) -> str:
         return self._backend.name
 
+    @property
+    def backend(self) -> SQLBackend:
+        """The Ibis SQL backend for this data source."""
+        return self._backend
+
     def get_schema(self, *, categorical_threshold: int) -> str:
-        columns = [
+        metas = self.get_column_metas()
+        self.populate_column_stats(metas, categorical_threshold)
+        return format_schema(self.table_name, metas)
+
+    def get_column_metas(self) -> list[ColumnMeta]:
+        return [
             self._make_column_meta(name, dtype) for name, dtype in self._schema.items()
         ]
+
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
         self._add_column_stats(columns, self._table, categorical_threshold)
-        return format_schema(self.table_name, columns)
 
     def get_semantic_views_description(self) -> str:
         """Get information about semantic views (if any) for the system prompt."""
diff --git a/pkg-py/src/querychat/_gradio.py b/pkg-py/src/querychat/_gradio.py
index cc0067084..18a87cb88 100644
--- a/pkg-py/src/querychat/_gradio.py
+++ b/pkg-py/src/querychat/_gradio.py
@@ -10,11 +10,10 @@
 if TYPE_CHECKING:
     import narwhals.stable.v1 as nw
 
-from ._querychat_base import TOOL_GROUPS, QueryChatBase
+from ._querychat_base import TOOL_GROUPS, StateDictQueryChat
 from ._querychat_core import (
     GREETING_PROMPT,
     AppStateDict,
-    StateDictAccessorMixin,
     create_app_state,
     stream_response,
 )
@@ -31,8 +30,10 @@
 
     import gradio as gr
 
+    from ._data_dict import DataDict
 
-class QueryChat(QueryChatBase[IntoFrameT], StateDictAccessorMixin[IntoFrameT]):
+
+class QueryChat(StateDictQueryChat[IntoFrameT]):
     """
     QueryChat for Gradio applications.
 
@@ -86,16 +87,17 @@ def update_outputs(state_dict):
     @overload
     def __init__(
         self: QueryChat[Any],
-        data_source: None,
-        table_name: str,
+        data_source: None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -107,10 +109,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -122,10 +125,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -137,10 +141,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -152,24 +157,26 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None,
-        table_name: str,
+        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ):
         super().__init__(
             data_source,
@@ -178,6 +185,7 @@ def __init__(
             client=client,
             tools=tools,
             data_description=data_description,
+            data_dict=data_dict,
             categorical_threshold=categorical_threshold,
             extra_instructions=extra_instructions,
             prompt_template=prompt_template,
@@ -247,11 +255,14 @@ def ui(self) -> gr.State:
         >>> app.launch(css=qc.css, head=qc.head)
 
         """
-        data_source = self._require_data_source("ui")
+        self._require_initialized("ui")
         import gradio as gr
 
         initial_state = create_app_state(
-            data_source, self._client_factory, self.greeting
+            data_sources=dict(self._data_sources),
+            client_factory=self._client_factory,
+            greeting=self.greeting,
+            query_executor=self._require_query_executor("ui"),
         )
 
         state_holder = gr.State(value=initial_state.to_dict())
@@ -328,12 +339,12 @@ def app(self) -> GradioBlocksWrapper:
             querychat CSS/JS at launch time for Gradio 6.0+ compatibility.
 
         """
-        data_source = self._require_data_source("app")
+        self._require_initialized("app")
         from gradio.themes import Soft
 
         import gradio as gr
 
-        table_name = data_source.table_name
+        table_name = next(iter(self._data_sources))
 
         with gr.Blocks(
             title=f"querychat with {table_name}",
@@ -368,17 +379,14 @@ def app(self) -> GradioBlocksWrapper:
 
             def update_displays(state_dict: AppStateDict):
                 """Update SQL and data displays based on state."""
-                title = state_dict.get("title") if state_dict else None
-                error = state_dict.get("error") if state_dict else None
+                state = self._deserialize_state(state_dict)
+                df = state.get_current_data()
+                title = state.title
+                error = state.error
 
                 sql_title_text = f"### {title or 'SQL Query'}"
-                sql_code = (
-                    state_dict.get("sql")
-                    if state_dict and state_dict.get("sql")
-                    else f"SELECT * FROM {table_name}"
-                )
+                sql_code = state.get_display_sql()
 
-                df = self.df(state_dict)
                 nw_df = as_narwhals(df)
                 nrow, ncol = nw_df.shape
                 native_df = nw_df.to_native()
diff --git a/pkg-py/src/querychat/_icons.py b/pkg-py/src/querychat/_icons.py
index fc484c9c0..25cabdf00 100644
--- a/pkg-py/src/querychat/_icons.py
+++ b/pkg-py/src/querychat/_icons.py
@@ -9,6 +9,7 @@
     "download",
     "funnel-fill",
     "graph-up",
+    "search",
     "terminal-fill",
     "table",
 ]
@@ -30,6 +31,7 @@ def bs_icon(name: ICON_NAMES, cls: str = "") -> ui.HTML:
     "chevron-down": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-chevron-down" style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img"><path fill-rule="evenodd" d="M1.646 4.646a.5.5 0 0 1 .708 0L8 10.293l5.646-5.647a.5.5 0 0 1 .708.708l-6 6a.5.5 0 0 1-.708 0l-6-6a.5.5 0 0 1 0-.708"/></svg>',
     "download": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-download" style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img"><path d="M.5 9.9a.5.5 0 0 1 .5.5v2.5a1 1 0 0 0 1 1h12a1 1 0 0 0 1-1v-2.5a.5.5 0 0 1 1 0v2.5a2 2 0 0 1-2 2H2a2 2 0 0 1-2-2v-2.5a.5.5 0 0 1 .5-.5"/><path d="M7.646 11.854a.5.5 0 0 0 .708 0l3-3a.5.5 0 0 0-.708-.708L8.5 10.293V1.5a.5.5 0 0 0-1 0v8.793L5.354 8.146a.5.5 0 1 0-.708.708z"/></svg>',
     "funnel-fill": '<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" class="bi bi-funnel-fill" viewBox="0 0 16 16"><path d="M1.5 1.5A.5.5 0 0 1 2 1h12a.5.5 0 0 1 .5.5v2a.5.5 0 0 1-.128.334L10 8.692V13.5a.5.5 0 0 1-.342.474l-3 1A.5.5 0 0 1 6 14.5V8.692L1.628 3.834A.5.5 0 0 1 1.5 3.5z"/></svg>',
+    "search": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-search" style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img"><path d="M11.742 10.344a6.5 6.5 0 1 0-1.397 1.398h-.001q.044.06.098.115l3.85 3.85a1 1 0 0 0 1.415-1.414l-3.85-3.85a1 1 0 0 0-.115-.099M12 6.5a5.5 5.5 0 1 1-11 0 5.5 5.5 0 0 1 11 0"/></svg>',
     "graph-up": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-graph-up" style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img"><path fill-rule="evenodd" d="M0 0h1v15h15v1H0zm14.817 3.113a.5.5 0 0 1 .07.704l-4.5 5.5a.5.5 0 0 1-.74.037L7.06 6.767l-3.656 5.027a.5.5 0 0 1-.808-.588l4-5.5a.5.5 0 0 1 .758-.06l2.609 2.61 4.15-5.073a.5.5 0 0 1 .704-.07"/></svg>',
     "terminal-fill": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-terminal-fill " style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img" ><path d="M0 3a2 2 0 0 1 2-2h12a2 2 0 0 1 2 2v10a2 2 0 0 1-2 2H2a2 2 0 0 1-2-2V3zm9.5 5.5h-3a.5.5 0 0 0 0 1h3a.5.5 0 0 0 0-1zm-6.354-.354a.5.5 0 1 0 .708.708l2-2a.5.5 0 0 0 0-.708l-2-2a.5.5 0 1 0-.708.708L4.793 6.5 3.146 8.146z"></path></svg>',
     "table": '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-table " style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img" ><path d="M0 2a2 2 0 0 1 2-2h12a2 2 0 0 1 2 2v12a2 2 0 0 1-2 2H2a2 2 0 0 1-2-2V2zm15 2h-4v3h4V4zm0 4h-4v3h4V8zm0 4h-4v3h3a1 1 0 0 0 1-1v-2zm-5 3v-3H6v3h4zm-5 0v-3H1v2a1 1 0 0 0 1 1h3zm-4-4h4V8H1v3zm0-4h4V4H1v3zm5-3v3h4V4H6zm4 4H6v3h4V8z"></path></svg>',
diff --git a/pkg-py/src/querychat/_pin_source.py b/pkg-py/src/querychat/_pin_source.py
index 58240f8cb..fd62ae9ef 100644
--- a/pkg-py/src/querychat/_pin_source.py
+++ b/pkg-py/src/querychat/_pin_source.py
@@ -7,10 +7,13 @@
 import narwhals.stable.v1 as nw
 
 from ._datasource import (
+    ColumnMeta,
     DataSource,
     MissingColumnsError,
-    duckdb_get_schema,
+    duckdb_column_meta,
+    duckdb_column_stats,
     duckdb_lock_down,
+    format_schema,
 )
 from ._utils import check_query
 
@@ -186,7 +189,18 @@ def get_db_type(self) -> str:
         return "DuckDB"
 
     def get_schema(self, *, categorical_threshold: int) -> str:
-        return duckdb_get_schema(self._conn, self.table_name, categorical_threshold)
+        metas = self.get_column_metas()
+        self.populate_column_stats(metas, categorical_threshold)
+        return format_schema(self.table_name, metas)
+
+    def get_column_metas(self) -> list[ColumnMeta]:
+        result = self._conn.execute(f'SELECT * FROM "{self.table_name}" LIMIT 0')
+        return [duckdb_column_meta(desc[0], desc[1]) for desc in result.description]
+
+    def populate_column_stats(
+        self, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        duckdb_column_stats(self._conn, self.table_name, columns, categorical_threshold)
 
     def execute_query(self, query: str) -> nw.DataFrame:
         check_query(query)
diff --git a/pkg-py/src/querychat/_query_executor.py b/pkg-py/src/querychat/_query_executor.py
new file mode 100644
index 000000000..ab5a46b02
--- /dev/null
+++ b/pkg-py/src/querychat/_query_executor.py
@@ -0,0 +1,306 @@
+"""QueryExecutor abstraction for cross-table query execution."""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from typing import TYPE_CHECKING, Any
+
+import duckdb
+import narwhals.stable.v1 as nw
+
+from ._datasource import (
+    ColumnMeta,
+    MissingColumnsError,
+    duckdb_column_meta,
+    duckdb_column_stats,
+    duckdb_lock_down,
+    format_schema,
+)
+from ._utils import check_query
+
+if TYPE_CHECKING:
+    from ._datasource import DataFrameSource, DataSource, PolarsLazySource
+
+
+class QueryExecutor(ABC):
+    """Abstract query backend: the execution/validation surface the tools call."""
+
+    @abstractmethod
+    def execute_query(self, query: str) -> Any: ...
+
+    @abstractmethod
+    def test_query(self, query: str, *, table_name: str, require_all_columns: bool = False) -> None: ...
+
+    @abstractmethod
+    def get_db_type(self) -> str: ...
+
+    @abstractmethod
+    def cleanup(self) -> None: ...
+
+    @abstractmethod
+    def get_column_metas(self, table_name: str) -> list[ColumnMeta]: ...
+
+    @abstractmethod
+    def populate_column_stats(
+        self, table_name: str, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None: ...
+
+    def get_column_details(self, table_name: str, categorical_threshold: int) -> list[ColumnMeta]:
+        """Fetch column metadata for ``table_name`` and populate its statistics."""
+        columns = self.get_column_metas(table_name)
+        self.populate_column_stats(table_name, columns, categorical_threshold)
+        return columns
+
+    def get_schema(self, table_name: str, categorical_threshold: int) -> str:
+        """Render ``table_name``'s detailed column metadata through ``format_schema``."""
+        return format_schema(table_name, self.get_column_details(table_name, categorical_threshold))
+
+    @staticmethod
+    def _validate_missing_columns(result_columns: set[str], expected_columns: list[str]) -> None:
+        """Raise ``MissingColumnsError`` when an expected column is absent from the result."""
+        absent = sorted(set(expected_columns) - result_columns)
+        if not absent:
+            return
+        quoted_absent = ", ".join(f"'{c}'" for c in absent)
+        quoted_expected = ", ".join(f"'{c}'" for c in expected_columns)
+        raise MissingColumnsError(
+            f"Query result missing required columns: {quoted_absent}. "
+            f"The query must return all original table columns. "
+            f"Original columns: {quoted_expected}"
+        )
+
+
+class DuckDBExecutor(QueryExecutor):
+    """Shared in-memory DuckDB connection for multi-table DataFrameSource queries."""
+
+    def __init__(self, sources: dict[str, DataFrameSource]):
+        """Register each source's data under its table name, then lock the connection down."""
+        self._df_lib = get_shared_dataframe_backend(sources)
+        self._conn = duckdb.connect(database=":memory:")
+        for name, source in sources.items():
+            self._conn.register(name, source.get_data())
+
+        # Cache column names per table before lockdown
+        self._table_columns: dict[str, list[str]] = {}
+        for name in sources:
+            result = self._conn.execute(f'SELECT * FROM "{name}" LIMIT 0')
+            self._table_columns[name] = [desc[0] for desc in result.description]
+        duckdb_lock_down(self._conn)
+
+    def execute_query(self, query: str) -> Any:
+        """Validate ``query`` with ``check_query``, run it, and convert the result."""
+        check_query(query)
+        return self._convert_result(self._conn.execute(query))
+
+    def _convert_result(self, result: duckdb.DuckDBPyConnection) -> Any:
+        """Materialize ``result`` in the DataFrame library shared by the sources."""
+        if self._df_lib == "polars":
+            return result.pl()
+        if self._df_lib == "pandas":
+            return result.df()
+        if self._df_lib == "pyarrow":
+            return result.fetch_arrow_table()
+        raise ValueError(
+            f"Unsupported DataFrame backend: '{self._df_lib}'. "
+            "Supported backends are: polars, pandas, pyarrow"
+        )
+
+    def test_query(
+        self, query: str, *, table_name: str, require_all_columns: bool = False
+    ) -> None:
+        """Dry-run ``query``; with ``require_all_columns``, demand every table column."""
+        check_query(query)
+        # Wrap as a subquery: a bare " LIMIT 1" suffix breaks queries already ending in LIMIT.
+        result = self._conn.execute(f"SELECT * FROM ({query}) AS subquery LIMIT 1")
+        if require_all_columns:
+            result_columns = {desc[0] for desc in result.description}
+            self._validate_missing_columns(result_columns, self._table_columns[table_name])
+
+    def get_db_type(self) -> str:
+        return "DuckDB"
+
+    def cleanup(self) -> None:
+        if self._conn:
+            self._conn.close()
+
+    def get_column_metas(self, table_name: str) -> list[ColumnMeta]:
+        result = self._conn.execute(f'SELECT * FROM "{table_name}" LIMIT 0')
+        return [duckdb_column_meta(desc[0], desc[1]) for desc in result.description]
+
+    def populate_column_stats(
+        self, table_name: str, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        duckdb_column_stats(self._conn, table_name, columns, categorical_threshold)
+
+
+class PolarsSQLExecutor(QueryExecutor):
+    """Runs multi-table PolarsLazySource queries through one shared Polars SQLContext."""
+
+    def __init__(self, sources: dict[str, PolarsLazySource]):
+        import polars as pl
+
+        self._ctx = pl.SQLContext({name: src.get_data() for name, src in sources.items()})
+        self._sources = sources  # stored for schema delegation
+        # Column names per table, taken from each source's collected schema.
+        self._table_columns: dict[str, list[str]] = {
+            name: list(src.get_data().collect_schema().keys()) for name, src in sources.items()
+        }
+
+    def execute_query(self, query: str) -> Any:
+        """Validate ``query`` with ``check_query`` and execute it on the SQLContext."""
+        check_query(query)
+        return self._ctx.execute(query)
+
+    def test_query(
+        self, query: str, *, table_name: str, require_all_columns: bool = False
+    ) -> None:
+        """Collect one row of ``query``; optionally verify it keeps every table column."""
+        check_query(query)
+        self._ctx.execute(f"SELECT * FROM ({query}) AS subquery LIMIT 1").collect()
+        if not require_all_columns:
+            return
+        returned = set(self._ctx.execute(query).collect_schema().keys())
+        self._validate_missing_columns(returned, self._table_columns[table_name])
+
+    def get_db_type(self) -> str:
+        return "Polars"
+
+    def cleanup(self) -> None:
+        """No-op; this executor performs no cleanup."""
+
+    def get_column_metas(self, table_name: str) -> list[ColumnMeta]:
+        """Delegate to the ``get_column_metas`` of the source registered as ``table_name``."""
+        return self._sources[table_name].get_column_metas()
+
+    def populate_column_stats(
+        self, table_name: str, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        self._sources[table_name].populate_column_stats(columns, categorical_threshold)
+
+
+class DataSourceExecutor(QueryExecutor):
+    """
+    Executor that forwards to DataSource objects which already share a connection.
+
+    Serves single-table mode (any source type) as well as multi-table
+    SQLAlchemy/Ibis setups whose sources all share one database backend.
+    """
+
+    def __init__(self, data_sources: dict[str, DataSource]):
+        validate_source_group_compatibility(data_sources)
+        self._data_sources = data_sources
+        # The first source in dict order runs queries and reports the DB type.
+        self._primary = next(iter(data_sources.values()))
+
+    def execute_query(self, query: str) -> Any:
+        return self._primary.execute_query(query)
+
+    def test_query(
+        self, query: str, *, table_name: str, require_all_columns: bool = False
+    ) -> None:
+        target = self._data_sources[table_name]
+        target.test_query(query, require_all_columns=require_all_columns)
+
+    def get_db_type(self) -> str:
+        return self._primary.get_db_type()
+
+    def cleanup(self) -> None:
+        """No-op; this executor performs no cleanup of the wrapped sources."""
+
+    def get_column_metas(self, table_name: str) -> list[ColumnMeta]:
+        return self._data_sources[table_name].get_column_metas()
+
+    def populate_column_stats(
+        self, table_name: str, columns: list[ColumnMeta], categorical_threshold: int
+    ) -> None:
+        self._data_sources[table_name].populate_column_stats(columns, categorical_threshold)
+
+
+def get_shared_dataframe_backend(sources: dict[str, DataFrameSource]) -> str:
+    """Return the backend name shared by all ``sources``; ValueError if empty or mixed."""
+    if not sources:
+        raise ValueError("Cannot determine a DataFrame backend: no sources were provided.")
+    source_items = iter(sources.items())
+    _, first_source = next(source_items)
+    shared_lib = get_dataframe_backend_name(first_source)
+    for name, source in source_items:
+        source_lib = get_dataframe_backend_name(source)
+        if source_lib != shared_lib:
+            raise ValueError(
+                f"Cannot add table '{name}': all DataFrameSources must use "
+                f"the same DataFrame backend. "
+                f"Existing tables use {shared_lib}, new table uses {source_lib}."
+            )
+    return shared_lib
+
+
+def validate_source_group_compatibility(data_sources: dict[str, DataSource]) -> None:
+    """Check each source, in dict order, for compatibility with those preceding it."""
+    seen: dict[str, DataSource] = {}
+    for table, candidate in data_sources.items():
+        check_source_compatibility(seen, candidate, table)
+        seen[table] = candidate
+
+
+def check_source_compatibility(
+    existing: dict[str, DataSource],
+    new_source: DataSource,
+    new_name: str,
+) -> None:
+    """
+    Check that ``new_source`` may be registered alongside ``existing``.
+
+    Only the first entry of ``existing`` serves as the reference; an empty
+    ``existing`` accepts any source.
+
+    Raises
+    ------
+    ValueError
+        If the two sources differ in concrete type, in DataFrame backend
+        name, in SQLAlchemy ``engine`` object, or in Ibis ``backend`` object.
+
+    """
+    if not existing:
+        return
+
+    from ._datasource import DataFrameSource, IbisSource, SQLAlchemySource
+
+    reference = next(iter(existing.values()))
+
+    if type(new_source) is not type(reference):
+        raise ValueError(
+            f"Cannot add {type(new_source).__name__} table '{new_name}': "
+            f"all tables must be the same type. "
+            f"Existing tables use {type(reference).__name__}."
+        )
+
+    if isinstance(new_source, DataFrameSource) and isinstance(reference, DataFrameSource):
+        new_lib = get_dataframe_backend_name(new_source)
+        existing_lib = get_dataframe_backend_name(reference)
+        if new_lib != existing_lib:
+            raise ValueError(
+                f"Cannot add table '{new_name}': all DataFrameSources must use "
+                f"the same DataFrame backend. "
+                f"Existing tables use {existing_lib}, new table uses {new_lib}."
+            )
+
+    if isinstance(new_source, SQLAlchemySource) and isinstance(reference, SQLAlchemySource):
+        if new_source.engine is not reference.engine:
+            raise ValueError(
+                f"Cannot add table '{new_name}': all SQLAlchemy tables must "
+                f"share the same Engine instance."
+            )
+
+    if isinstance(new_source, IbisSource) and isinstance(reference, IbisSource):
+        if new_source.backend is not reference.backend:
+            raise ValueError(
+                f"Cannot add table '{new_name}': all Ibis tables must "
+                f"share the same backend instance."
+            )
+
+
+def get_dataframe_backend_name(source: DataFrameSource) -> str:
+    """Name of the module (e.g. ``"polars"``) backing the source's eager data."""
+    eager_frame = nw.from_native(source.get_data(), eager_only=True)
+    namespace = nw.get_native_namespace(eager_frame)
+    return namespace.__name__
diff --git a/pkg-py/src/querychat/_querychat_base.py b/pkg-py/src/querychat/_querychat_base.py
index feaf3a45d..782660ff8 100644
--- a/pkg-py/src/querychat/_querychat_base.py
+++ b/pkg-py/src/querychat/_querychat_base.py
@@ -2,9 +2,11 @@
 
 from __future__ import annotations
 
+import contextlib
 import copy
 import os
 import re
+import warnings
 from pathlib import Path
 from typing import TYPE_CHECKING, Generic, Literal, Optional
 
@@ -21,12 +23,28 @@
     SQLAlchemySource,
 )
 from ._pin_source import PinSource, is_pins_board
-from ._querychat_core import GREETING_PROMPT
+from ._query_executor import (
+    DataSourceExecutor,
+    DuckDBExecutor,
+    PolarsSQLExecutor,
+    QueryExecutor,
+    check_source_compatibility,
+    validate_source_group_compatibility,
+)
+from ._querychat_core import (
+    GREETING_PROMPT,
+    AppState,
+    AppStateDict,
+    create_app_state,
+    warn_multi_table_flat_accessor,
+)
 from ._system_prompt import QueryChatSystemPrompt
 from ._utils import MISSING, MISSING_TYPE, is_ibis_table
 from ._viz_utils import has_viz_deps, has_viz_tool
 from .tools import (
+    ResetDashboardCallback,
     UpdateDashboardData,
+    tool_get_schema,
     tool_query,
     tool_reset_dashboard,
     tool_update_dashboard,
@@ -39,6 +57,7 @@
     from narwhals.stable.v1.typing import IntoFrame
     from pins.boards import BaseBoard
 
+    from ._data_dict import DataDict
     from ._viz_tools import VisualizeData
 
 TOOL_GROUPS = Literal["filter", "update", "query", "visualize"]
@@ -59,36 +78,26 @@ class QueryChatBase(Generic[IntoFrameT]):
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | BaseBoard | None,
+        data_source: IntoFrame | sqlalchemy.Engine | BaseBoard | None = None,
         table_name: str | None = None,
         *,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | list[DataDict | str | Path] | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ):
-        if table_name is None:
-            if isinstance(data_source, DataSource):
-                table_name = data_source.table_name
-            elif data_source is not None:
-                raise ValueError(
-                    "table_name is required when data_source is not a DataSource"
-                )
+        self._data_dicts: list[DataDict] = _normalize_data_dicts(data_dict)
 
-        # Store table_name for later normalization
-        self._table_name = table_name
+        # Multi-table storage: dict of data sources keyed by table name
+        self._data_sources: dict[str, DataSource] = {}
+        self._query_executor: QueryExecutor | None = None
 
-        if (
-            table_name is not None
-            and not is_pins_board(data_source)
-            and not re.match(r"^[a-zA-Z][a-zA-Z0-9_]*$", table_name)
-        ):
-            raise ValueError(
-                "Table name must begin with a letter and contain only letters, numbers, and underscores",
-            )
+        # Track server initialization state for add/remove table validation
+        self._server_initialized = False
 
         self.tools = normalize_tools(tools, default=DEFAULT_TOOLS)
         self.greeting = greeting.read_text() if isinstance(greeting, Path) else greeting
@@ -96,66 +105,109 @@ def __init__(
         # Store init parameters for deferred system prompt building
         self._prompt_template = prompt_template
         self._data_description = data_description
-        self._data_description_mode: Literal["supplied", "inferred", "empty"] = (
-            "supplied" if data_description is not None else "empty"
-        )
         self._extra_instructions = extra_instructions
         self._categorical_threshold = categorical_threshold
 
         self._client_spec: str | chatlas.Chat | None = client
         self._client_console = None
 
-        # Initialize data source (may be None for deferred pattern)
+        self._system_prompt: QueryChatSystemPrompt | None = None
+
         if data_source is not None:
             if table_name is None:
-                raise ValueError("table_name is required when data_source is provided")
-            self._data_source: DataSource | None = normalize_data_source(
-                data_source, table_name
-            )
-            self._table_name = self._data_source.table_name
-            self._auto_fill_data_description()
-            self._build_system_prompt()
-        else:
-            self._data_source = None
-            self._system_prompt = None
-
-    def _auto_fill_data_description(self) -> None:
-        """Auto-populate data_description from data source metadata if not user-supplied."""
-        if self._data_description_mode == "inferred":
-            self._data_description = None
-            self._data_description_mode = "empty"
-        if self._data_description_mode == "empty" and self._data_source is not None:
-            desc = self._data_source.get_data_description()
-            if desc:
-                self._data_description = desc
-                self._data_description_mode = "inferred"
-
-    def _build_system_prompt(self) -> None:
-        """Build/rebuild the system prompt from current data source."""
-        if self._data_source is None:
+                if isinstance(data_source, DataSource):
+                    table_name = data_source.table_name
+                else:
+                    raise ValueError(
+                        "table_name is required when data_source is provided"
+                    )
+            self.add_table(data_source, table_name)
+
+    def _build_system_prompt(
+        self,
+        *,
+        data_sources: dict[str, DataSource] | None = None,
+    ) -> None:
+        """Build/rebuild the system prompt from current or staged data sources."""
+        next_data_sources = self._data_sources if data_sources is None else data_sources
+
+        if not next_data_sources:
             raise RuntimeError("Cannot build system prompt without data_source")
 
-        prompt_template = self._prompt_template
-        if prompt_template is None:
-            prompt_template = Path(__file__).parent / "prompts" / "prompt.md"
+        client_has_history = (
+            isinstance(self._client_spec, chatlas.Chat) and bool(self._client_spec.get_turns())
+        ) or (
+            self._client_console is not None and bool(self._client_console.get_turns())
+        )
+        if client_has_history:
+            warnings.warn(
+                "System prompt rebuilt after chat history exists. "
+                "This invalidates any prompt caching from prior turns. "
+                "Configure all tables before starting a conversation.",
+                UserWarning,
+                stacklevel=3,
+            )
 
         self._system_prompt = QueryChatSystemPrompt(
-            prompt_template=prompt_template,
-            data_source=self._data_source,
+            prompt_template=self._prompt_template,
+            data_sources=next_data_sources,
             data_description=self._data_description,
             extra_instructions=self._extra_instructions,
             categorical_threshold=self._categorical_threshold,
+            data_dicts=self._data_dicts,
         )
 
-    def _require_data_source(self, method_name: str) -> DataSource[IntoFrameT]:
-        """Raise if data_source is not set, otherwise return it for type narrowing."""
-        if self._data_source is None:
+    def _build_query_executor(
+        self, *, data_sources: dict[str, DataSource] | None = None
+    ) -> QueryExecutor:
+        """
+        Choose and construct the executor for the given or current sources.
+
+        ``data_sources`` overrides ``self._data_sources`` when supplied. After
+        compatibility validation, several DataFrameSources share a
+        DuckDBExecutor, several PolarsLazySources share a PolarsSQLExecutor,
+        and anything else (including a lone source) gets a DataSourceExecutor.
+        """
+        sources = data_sources if data_sources is not None else self._data_sources
+        validate_source_group_compatibility(sources)
+
+        if len(sources) != 1:
+            head = next(iter(sources.values()))
+            if isinstance(head, DataFrameSource):
+                frame_sources = {n: s for n, s in sources.items() if isinstance(s, DataFrameSource)}
+                return DuckDBExecutor(frame_sources)
+            if isinstance(head, PolarsLazySource):
+                lazy_sources = {n: s for n, s in sources.items() if isinstance(s, PolarsLazySource)}
+                return PolarsSQLExecutor(lazy_sources)
+        return DataSourceExecutor(dict(sources))
+
+    def _require_initialized(self, method_name: str) -> None:
+        """Raise if no data sources have been registered."""
+        if not self._data_sources:
             raise RuntimeError(
-                f"data_source must be set before calling {method_name}(). "
-                "Either pass data_source to __init__(), set the data_source property, "
-                "or pass data_source to server()."
+                f"At least one data source must be set before calling {method_name}(). "
+                "Either pass data_source to __init__() or call add_table()."
+            )
+
+    def _require_single_table(self, method_name: str) -> None:
+        """Raise if multiple tables are registered, directing to per-table API."""
+        if len(self._data_sources) > 1:
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            raise AttributeError(
+                f"Cannot use .{method_name}() with multiple tables ({table_list}). "
+                f"Use .table('name').{method_name}() for per-table access."
             )
-        return self._data_source
+
+    def _require_query_executor(self, method_name: str) -> QueryExecutor:
+        """Return the cached executor, building it on first use; RuntimeError if no tables."""
+        if self._query_executor is None:
+            if not self._data_sources:
+                raise RuntimeError(
+                    f"query executor must be set before calling {method_name}(). "
+                    "Pass data_source to __init__() or call add_table() first."
+                )
+            self._query_executor = self._build_query_executor()
+        return self._query_executor
 
     def _create_session_client(
         self,
@@ -163,7 +215,7 @@ def _create_session_client(
         client_spec: str | chatlas.Chat | None | MISSING_TYPE = MISSING,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None | MISSING_TYPE = MISSING,
         update_dashboard: Callable[[UpdateDashboardData], None] | None = None,
-        reset_dashboard: Callable[[], None] | None = None,
+        reset_dashboard: ResetDashboardCallback | None = None,
         visualize: Callable[[VisualizeData], None] | None = None,
     ) -> chatlas.Chat:
         """Create a fresh, fully-configured Chat."""
@@ -178,20 +230,44 @@ def _create_session_client(
         if resolved_tools is None:
             return chat
 
-        data_source = self._require_data_source("_create_session_client")
+        executor = self._require_query_executor("_create_session_client")
+
+        # Always register the schema tool (for all non-None tool sets)
+        chat.register_tool(
+            tool_get_schema(
+                self._data_dicts,
+                executor,
+                list(self._data_sources.keys()),
+                self._categorical_threshold,
+            )
+        )
 
         if "update" in resolved_tools:
             update_fn = update_dashboard or (lambda _: None)
-            reset_fn = reset_dashboard or (lambda: None)
-            chat.register_tool(tool_update_dashboard(data_source, update_fn))
-            chat.register_tool(tool_reset_dashboard(reset_fn))
+            user_reset = reset_dashboard or (lambda _table: None)
+
+            chat.register_tool(
+                tool_update_dashboard(
+                    executor,
+                    list(self._data_sources.keys()),
+                    update_fn,
+                    multi_table=len(self._data_sources) > 1,
+                )
+            )
+            chat.register_tool(
+                tool_reset_dashboard(user_reset, list(self._data_sources.keys()))
+            )
 
         if "query" in resolved_tools:
-            chat.register_tool(tool_query(data_source))
+            chat.register_tool(
+                tool_query(executor, multi_table=len(self._data_sources) > 1)
+            )
 
         if "visualize" in resolved_tools:
             viz_fn = visualize or (lambda _: None)
-            chat.register_tool(tool_visualize(data_source, viz_fn))
+            chat.register_tool(
+                tool_visualize(executor, viz_fn, multi_table=len(self._data_sources) > 1)
+            )
 
         return chat
 
@@ -200,7 +276,7 @@ def client(
         *,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None | MISSING_TYPE = MISSING,
         update_dashboard: Callable[[UpdateDashboardData], None] | None = None,
-        reset_dashboard: Callable[[], None] | None = None,
+        reset_dashboard: ResetDashboardCallback | None = None,
         visualize: Callable[[VisualizeData], None] | None = None,
     ) -> chatlas.Chat:
         """
@@ -225,7 +301,7 @@ def client(
             A configured chat client.
 
         """
-        self._require_data_source("client")
+        self._require_initialized("client")
         return self._create_session_client(
             tools=tools,
             update_dashboard=update_dashboard,
@@ -235,7 +311,7 @@ def client(
 
     def generate_greeting(self, *, echo: Literal["none", "output"] = "none") -> str:
         """Generate a welcome greeting for the chat."""
-        self._require_data_source("generate_greeting")
+        self._require_initialized("generate_greeting")
         chat = create_client(self._client_spec)
         if self._system_prompt is not None:
             chat.system_prompt = self._system_prompt.render(self.tools)
@@ -249,7 +325,7 @@ def console(
         **kwargs,
     ) -> None:
         """Launch an interactive console chat with the data."""
-        self._require_data_source("console")
+        self._require_initialized("console")
         if new or self._client_console is None:
             self._client_console = self.client(tools=tools, **kwargs)
 
@@ -258,32 +334,268 @@ def console(
     @property
     def system_prompt(self) -> str:
         """Get the system prompt."""
-        self._require_data_source("system_prompt")
+        self._require_initialized("system_prompt")
         if self._system_prompt is None:
             raise RuntimeError("System prompt not initialized")
         return self._system_prompt.render(self.tools)
 
     @property
-    def data_source(self) -> DataSource | None:
-        """Get the current data source."""
-        return self._data_source
+    def data_source(self) -> DataSource:
+        """Removed. Use ``add_table()`` and ``remove_table()`` to manage tables."""
+        raise AttributeError(
+            "The .data_source property has been removed. "
+            "Use qc.add_table(df, 'name') to add a new table, "
+            "or qc.add_table(df, 'name', replace=True) to replace an existing one."
+        )
 
     @data_source.setter
-    def data_source(self, value: IntoFrame | sqlalchemy.Engine | BaseBoard) -> None:
-        """Set the data source, normalizing and rebuilding system prompt."""
-        old_source = self._data_source
-        if self._table_name is None:
-            raise ValueError("table_name must be set before assigning a data source")
-        self._data_source = normalize_data_source(value, self._table_name)
-        if old_source is not None and old_source is not self._data_source:
+    def data_source(self, _value: object) -> None:
+        raise AttributeError(
+            "The .data_source setter has been removed. "
+            "Use qc.add_table(df, 'name') to add a new table, "
+            "or qc.add_table(df, 'name', replace=True) to replace an existing one."
+        )
+
+    def table_names(self) -> list[str]:
+        """
+        List the names of the currently registered tables.
+
+        Returns
+        -------
+        list[str]
+            A new list of table names, in the registry dict's iteration order.
+
+        """
+        return [*self._data_sources]
+
+    def add_table(
+        self,
+        data_source: IntoFrame | sqlalchemy.Engine | BaseBoard,
+        table_name: str,
+        *,
+        replace: bool = False,
+    ) -> None:
+        """
+        Add or replace a table in the QueryChat instance.
+
+        Parameters
+        ----------
+        data_source
+            The data source (DataFrame, LazyFrame, database connection, or pins board).
+        table_name
+            Name for the table.
+        replace
+            If True, replace an existing table with the same name.
+            If False (default), raise ValueError if the table already exists.
+
+        Raises
+        ------
+        ValueError
+            If table_name already exists (and replace=False) or is invalid.
+        RuntimeError
+            If called after server() has been invoked.
+
+        """
+        if self._server_initialized:
+            raise RuntimeError(
+                "Cannot add tables after server initialization. "
+                "Add all tables before calling .server() or .app()."
+            )
+
+        if not is_pins_board(data_source) and not re.match(
+            r"^[a-zA-Z][a-zA-Z0-9_]*$", table_name
+        ):
+            raise ValueError(
+                "Table name must begin with a letter and contain only "
+                "letters, numbers, and underscores"
+            )
+
+        if table_name in self._data_sources and not replace:
+            raise ValueError(f"Table '{table_name}' already exists")
+
+        normalized = normalize_data_source(data_source, table_name)
+        try:
+            other_sources = {
+                name: source
+                for name, source in self._data_sources.items()
+                if name != table_name
+            }
+            check_source_compatibility(other_sources, normalized, table_name)
+            next_data_sources = dict(self._data_sources)
+            next_data_sources[table_name] = normalized
+
+            self._build_system_prompt(data_sources=next_data_sources)
+        except Exception:
+            cleanup_failed_staged_source(data_source, normalized)
+            raise
+
+        old_source = self._data_sources.get(table_name)
+        self._data_sources = next_data_sources
+        if old_source is not None and old_source is not normalized:
             old_source.cleanup()
-        self._auto_fill_data_description()
-        self._build_system_prompt()
+        if self._query_executor is not None:
+            with contextlib.suppress(Exception):
+                self._query_executor.cleanup()
+            self._query_executor = None
+
+    def add_tables(
+        self,
+        data_source: sqlalchemy.Engine,
+        tables: list[str] | None = None,
+        *,
+        replace: bool = False,
+    ) -> None:
+        """
+        Add multiple tables from a SQLAlchemy engine in a single call.
+
+        Unlike calling :meth:`add_table` repeatedly, this method builds the
+        system prompt exactly once after all tables have been staged, avoiding
+        N-1 spurious intermediate rebuilds.
+
+        Parameters
+        ----------
+        data_source
+            A SQLAlchemy engine. Only engines are supported; pass individual
+            DataFrames or other sources via :meth:`add_table`.
+        tables
+            Table names to register. When ``None``, all tables returned by
+            ``sqlalchemy.inspect(data_source).get_table_names()`` are used.
+        replace
+            If ``True``, replace any existing table whose name appears in
+            ``tables``. If ``False`` (default), raise ``ValueError`` if any
+            name already exists.
+
+        Raises
+        ------
+        TypeError
+            If ``data_source`` is not a ``sqlalchemy.Engine``.
+        ValueError
+            If the resolved table list is empty, any name is invalid, or any
+            name already exists (and ``replace=False``).
+        RuntimeError
+            If called after :meth:`server` has been invoked.
+
+        Examples
+        --------
+        Register all tables from an engine:
+
+        >>> qc = QueryChat()
+        >>> qc.add_tables(engine)
+
+        Register a specific subset:
+
+        >>> qc.add_tables(engine, ["orders", "customers"])
+
+        """
+        if self._server_initialized:
+            raise RuntimeError(
+                "Cannot add tables after server initialization. "
+                "Add all tables before calling .server() or .app()."
+            )
+
+        if not isinstance(data_source, sqlalchemy.Engine):
+            raise TypeError(
+                f"add_tables() requires a sqlalchemy.Engine, got {type(data_source).__name__}. "
+                "Use add_table() for DataFrames and other source types."
+            )
+
+        if tables is None:
+            tables = sqlalchemy.inspect(data_source).get_table_names()
+
+        if not tables:
+            raise ValueError("No tables found in database")
+
+        for table_name in tables:
+            if not re.match(r"^[a-zA-Z][a-zA-Z0-9_]*$", table_name):
+                raise ValueError(
+                    "Table name must begin with a letter and contain only "
+                    "letters, numbers, and underscores"
+                )
+            if table_name in self._data_sources and not replace:
+                raise ValueError(f"Table '{table_name}' already exists")
+
+        normalized = {
+            name: normalize_data_source(data_source, name) for name in tables
+        }
+
+        staged: dict[str, DataSource] = {}
+        for name, source in normalized.items():
+            other_sources = {
+                n: s
+                for n, s in self._data_sources.items()
+                if n != name
+            }
+            check_source_compatibility({**other_sources, **staged}, source, name)
+            staged[name] = source
+
+        next_data_sources = {**self._data_sources, **normalized}
+        self._build_system_prompt(data_sources=next_data_sources)
+
+        for name, normalized_source in normalized.items():
+            old_source = self._data_sources.get(name)
+            if old_source is not None and old_source is not normalized_source:
+                old_source.cleanup()
+
+        self._data_sources = next_data_sources
+        if self._query_executor is not None:
+            with contextlib.suppress(Exception):
+                self._query_executor.cleanup()
+            self._query_executor = None
+
+    def remove_table(self, table_name: str) -> None:
+        """
+        Remove a table from the QueryChat instance.
+
+        Parameters
+        ----------
+        table_name
+            Name of the table to remove.
+
+        Raises
+        ------
+        ValueError
+            If table doesn't exist or is the last remaining table.
+        RuntimeError
+            If called after server() has been invoked.
+
+        """
+        if self._server_initialized:
+            raise RuntimeError(
+                "Cannot remove tables after server initialization. "
+                "Configure all tables before calling .server() or .app()."
+            )
+
+        if table_name not in self._data_sources:
+            available = ", ".join(self._data_sources.keys())
+            raise ValueError(f"Table '{table_name}' not found. Available: {available}")
+
+        if len(self._data_sources) == 1:
+            raise ValueError(
+                "Cannot remove last table. At least one table is required."
+            )
+
+        removed_source = self._data_sources[table_name]
+        next_data_sources = dict(self._data_sources)
+        del next_data_sources[table_name]
+
+        self._build_system_prompt(data_sources=next_data_sources)
+        self._data_sources = next_data_sources
+        if self._query_executor is not None:
+            with contextlib.suppress(Exception):
+                self._query_executor.cleanup()
+            self._query_executor = None
+        removed_source.cleanup()
+
+    def _mark_server_initialized(self) -> None:
+        """Mark that the server has been initialized. Prevents add/remove_table."""
+        self._server_initialized = True
 
     def cleanup(self) -> None:
-        """Clean up resources associated with the data source."""
-        if self._data_source is not None:
-            self._data_source.cleanup()
+        """Clean up resources associated with all data sources."""
+        if self._query_executor is not None:
+            self._query_executor.cleanup()
+        for source in self._data_sources.values():
+            source.cleanup()
 
 
 def normalize_data_source(
@@ -330,6 +642,24 @@ def normalize_data_source(
     )
 
 
+def cleanup_failed_staged_source(
+    original_source: IntoFrame | sqlalchemy.Engine | BaseBoard | DataSource,
+    normalized_source: DataSource,
+) -> None:
+    """
+    Clean up transient resources created during a failed staged rebuild.
+
+    DataFrameSource and PinSource both allocate disposable connections during
+    normalization. SQLAlchemySource wraps a caller-owned engine, while
+    PolarsLazySource and IbisSource do not allocate disposable resources here.
+    """
+    if isinstance(original_source, (DataSource, sqlalchemy.Engine)):
+        return
+
+    if isinstance(normalized_source, (DataFrameSource, PinSource)):
+        normalized_source.cleanup()
+
+
 def create_client(client: str | chatlas.Chat | None) -> chatlas.Chat:
     """Resolve a client spec into a fresh Chat with no conversation history."""
     if client is None:
@@ -371,3 +701,175 @@ def normalize_tools(
             "vl-convert-python. Install them with: pip install querychat[viz]"
         )
     return resolved
+
+
+def _normalize_data_dicts(
+    data_dict: DataDict | str | Path | list[DataDict | str | Path] | None,
+) -> list[DataDict]:
+    from ._data_dict import DataDict as _DataDict
+
+    if data_dict is None:
+        return []
+    if isinstance(data_dict, list):
+        return [
+            _DataDict.from_yaml(item) if isinstance(item, (str, Path)) else item
+            for item in data_dict
+        ]
+    if isinstance(data_dict, (str, Path)):
+        return [_DataDict.from_yaml(data_dict)]
+    return [data_dict]
+
+
+def _get_table_sql(state: AppStateDict | None, table: str) -> str | None:
+    """Extract the SQL for a specific table from a serialized state dict."""
+    if state is None:
+        return None
+    per_table = state.get("table_states")
+    if per_table and table in per_table:
+        return per_table[table].get("sql")
+    # Backward compat: no per-table entry; use flat "sql" if this is the active table
+    if state.get("table") == table:
+        return state.get("sql")
+    return None
+
+
+class StateDictQueryChat(QueryChatBase[IntoFrameT]):
+    """Base for Dash and Gradio adapters that pass serialized state dicts per request."""
+
+    def _client_factory(
+        self,
+        update_cb: Callable[[UpdateDashboardData], None],
+        reset_cb: Callable[[str], None],
+    ) -> chatlas.Chat:
+        """Create a chat client with dashboard callbacks."""
+        return self.client(update_dashboard=update_cb, reset_dashboard=reset_cb)
+
+    def _df_for_source(
+        self, data_source: DataSource[IntoFrameT], sql: str | None
+    ) -> IntoFrameT:
+        if sql:
+            with contextlib.suppress(Exception):
+                return self._require_query_executor("df").execute_query(sql)
+        return data_source.get_data()
+
+    def df(self, state: AppStateDict | None, *, table: str | None = None) -> IntoFrameT:
+        """
+        Get the current DataFrame from state.
+
+        Parameters
+        ----------
+        state
+            The state dictionary from a framework callback.
+        table
+            Table name to read. Defaults to the first registered table when None.
+
+        Returns
+        -------
+        :
+            The filtered data if a SQL query is active, otherwise the full dataset.
+            Returns a LazyFrame if the data source is lazy.
+
+        """
+        if table is not None:
+            return self._df_for_source(
+                self._data_sources[table], _get_table_sql(state, table)
+            )
+        if len(self._data_sources) > 1:
+            primary_name = next(iter(self._data_sources))
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            warn_multi_table_flat_accessor("df", primary_name, table_list)
+            return self._df_for_source(
+                self._data_sources[primary_name], _get_table_sql(state, primary_name)
+            )
+        data_source = self._get_state_data_source(state)
+        return self._df_for_source(data_source, state.get("sql") if state else None)
+
+    def _get_state_data_source(
+        self, state: AppStateDict | None
+    ) -> DataSource[IntoFrameT]:
+        """Resolve the full-data source for a serialized state payload."""
+        self._require_initialized("_get_state_data_source")
+        first_source: DataSource[IntoFrameT] = next(iter(self._data_sources.values()))
+        if not state:
+            return first_source
+        table_name = state.get("table")
+        if table_name is not None and table_name in self._data_sources:
+            return self._data_sources[table_name]
+        return first_source
+
+    def sql(self, state: AppStateDict | None, *, table: str | None = None) -> str | None:
+        """
+        Get the current SQL query from state.
+
+        Parameters
+        ----------
+        state
+            The state dictionary from a framework callback.
+        table
+            Table name. Defaults to the first registered table when None.
+
+        Returns
+        -------
+        :
+            The current SQL query, or None if showing full dataset.
+
+        """
+        if table is not None:
+            return _get_table_sql(state, table)
+        if len(self._data_sources) > 1:
+            primary_name = next(iter(self._data_sources))
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            warn_multi_table_flat_accessor("sql", primary_name, table_list)
+            return _get_table_sql(state, primary_name)
+        return state.get("sql") if state else None
+
+    def _title_for_table(
+        self, state: AppStateDict | None, table: str
+    ) -> str | None:
+        if state is None:
+            return None
+        per_table = state.get("table_states")
+        if per_table and table in per_table:
+            return per_table[table].get("title")
+        if state.get("table") == table:
+            return state.get("title")
+        return None
+
+    def title(self, state: AppStateDict | None, *, table: str | None = None) -> str | None:
+        """
+        Get the current query title from state.
+
+        Parameters
+        ----------
+        state
+            The state dictionary from a framework callback.
+        table
+            Table name. Defaults to the first registered table when None.
+
+        Returns
+        -------
+        :
+            A short description of the current filter, or None if showing full dataset.
+
+        """
+        if table is not None:
+            return self._title_for_table(state, table)
+        if len(self._data_sources) > 1:
+            primary_name = next(iter(self._data_sources))
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            warn_multi_table_flat_accessor("title", primary_name, table_list)
+            return self._title_for_table(state, primary_name)
+        return state.get("title") if state else None
+
+    def _deserialize_state(self, state_data: AppStateDict | None) -> AppState:
+        """Reconstruct AppState from a serialized state dict."""
+        self._require_initialized("_deserialize_state")
+        state = create_app_state(
+            data_sources=dict(self._data_sources),
+            client_factory=self._client_factory,
+            greeting=self.greeting,
+            query_executor=self._require_query_executor("_deserialize_state"),
+        )
+        if state_data:
+            state.update_from_dict(state_data)
+        return state
diff --git a/pkg-py/src/querychat/_querychat_core.py b/pkg-py/src/querychat/_querychat_core.py
index fb3134beb..87d110ab7 100644
--- a/pkg-py/src/querychat/_querychat_core.py
+++ b/pkg-py/src/querychat/_querychat_core.py
@@ -7,19 +7,19 @@
     "AppState",
     "AppStateDict",
     "ClientFactory",
-    "StateDictAccessorMixin",
     "create_app_state",
     "stream_response",
     "stream_response_async",
 ]
 
+import warnings
 from collections.abc import Callable
 from dataclasses import dataclass
-from typing import TYPE_CHECKING, Generic, Optional, TypedDict, Union
+from typing import TYPE_CHECKING, Optional, TypedDict, Union
 
 from chatlas import Chat, ContentToolRequest, ContentToolResult
 from chatlas.types import Content
-from narwhals.stable.v1.typing import IntoFrameT
+from typing_extensions import NotRequired
 
 from .tools import UpdateDashboardData
 
@@ -36,21 +36,46 @@
     from narwhals.stable.v1.typing import IntoFrame
 
     from ._datasource import DataSource
+    from ._query_executor import QueryExecutor
 
 
 ClientFactory = Callable[
-    [Callable[[UpdateDashboardData], None], Callable[[], None]],
+    [Callable[[UpdateDashboardData], None], Callable[[str], None]],
     Chat,
 ]
 """Factory that creates a Chat client with update_dashboard and reset_dashboard callbacks."""
 
 
+def warn_multi_table_flat_accessor(
+    accessor_name: str, primary_table: str, table_list: str, stacklevel: int = 3
+) -> None:
+    """Emit a FutureWarning when a flat accessor is used with multiple tables registered."""
+    warnings.warn(
+        f".{accessor_name}() called without a table name, but multiple tables are registered "
+        f"({table_list}). Defaulting to primary table '{primary_table}'. "
+        f"Use .table('{primary_table}').{accessor_name}() to suppress this warning. "
+        f"In a future version of querychat, this will raise an error.",
+        FutureWarning,
+        stacklevel=stacklevel,
+    )
+
+
+class TableStateData(TypedDict):
+    """Per-table state for serialization."""
+
+    sql: str | None
+    title: str | None
+    error: str | None
+
+
 class AppStateDict(TypedDict):
     """Serialized AppState for framework state stores."""
 
+    table: NotRequired[str | None]
     sql: str | None
     title: str | None
     error: str | None
+    table_states: NotRequired[dict[str, TableStateData]]
     turns: list[dict]  # Serialized chatlas Turns via model_dump()
 
 
@@ -61,91 +86,6 @@ class DisplayMessage(TypedDict):
     content: str
 
 
-class StateDictAccessorMixin(Generic[IntoFrameT]):
-    """Mixin providing df/sql/title accessors for frameworks using serialized state dicts."""
-
-    _data_source: DataSource[IntoFrameT] | None
-
-    def _client_factory(
-        self,
-        update_cb: Callable[[UpdateDashboardData], None],
-        reset_cb: Callable[[], None],
-    ) -> Chat:
-        """Create a chat client with dashboard callbacks."""
-        return self.client(update_dashboard=update_cb, reset_dashboard=reset_cb)  # type: ignore[attr-defined]
-
-    def df(self, state: AppStateDict | None) -> IntoFrameT:
-        """
-        Get the current DataFrame from state.
-
-        Parameters
-        ----------
-        state
-            The state dictionary from a framework callback.
-
-        Returns
-        -------
-        :
-            The filtered data if a SQL query is active, otherwise the full dataset.
-            Returns a LazyFrame if the data source is lazy.
-
-        """
-        data_source = self._require_data_source("df")  # type: ignore[attr-defined]
-        sql = state.get("sql") if state else None
-        if sql:
-            try:
-                return data_source.execute_query(sql)
-            except Exception:
-                return data_source.get_data()
-        return data_source.get_data()
-
-    def sql(self, state: AppStateDict | None) -> str | None:
-        """
-        Get the current SQL query from state.
-
-        Parameters
-        ----------
-        state
-            The state dictionary from a framework callback.
-
-        Returns
-        -------
-        :
-            The current SQL query, or None if showing full dataset.
-
-        """
-        return state.get("sql") if state else None
-
-    def title(self, state: AppStateDict | None) -> str | None:
-        """
-        Get the current query title from state.
-
-        Parameters
-        ----------
-        state
-            The state dictionary from a framework callback.
-
-        Returns
-        -------
-        :
-            A short description of the current filter, or None if showing full dataset.
-
-        """
-        return state.get("title") if state else None
-
-    def _deserialize_state(self, state_data: AppStateDict | None) -> AppState:
-        """Reconstruct AppState from a serialized state dict."""
-        data_source = self._require_data_source("_deserialize_state")  # type: ignore[attr-defined]
-        state = create_app_state(
-            data_source,
-            self._client_factory,
-            self.greeting,  # type: ignore[attr-defined]
-        )
-        if state_data:
-            state.update_from_dict(state_data)
-        return state
-
-
 def format_chunk(chunk: Union[str, Content]) -> str:
     """Extract displayable text from a chat chunk."""
     if isinstance(chunk, ContentToolRequest):
@@ -163,7 +103,9 @@ def format_tool_result(result: ContentToolResult) -> str:
     display_info = result.extra.get("display") if result.extra else None
     if display_info and hasattr(display_info, "markdown"):
         return display_info.markdown
-    return str(result)
+    if result.value is not None:
+        return str(result.value)
+    return ""
 
 
 
@@ -199,41 +141,93 @@ def format_query_error(e: Exception) -> str:
 class AppState:
     """Framework-agnostic application state for a querychat session."""
 
-    data_source: DataSource
+    data_sources: dict[str, DataSource]
     client: Chat
+    query_executor: QueryExecutor | None = None
     greeting: Optional[str] = None
 
-    sql: Optional[str] = None
-    title: Optional[str] = None
-    error: Optional[str] = None
+    active_table: str | None = None
+    # sql, title, error are per-table properties backed by _table_states
 
-    def update_dashboard(self, data: UpdateDashboardData) -> None:
-        self.sql = data["query"]
-        self.title = data["title"]
-        self.error = None  # Clear any previous error on successful update
+    def __post_init__(self) -> None:
+        if self.active_table is None:
+            self.active_table = next(iter(self.data_sources))
+        self._table_states: dict[str, dict[str, str | None]] = {
+            name: {"sql": None, "title": None, "error": None}
+            for name in self.data_sources
+        }
 
-    def reset_dashboard(self) -> None:
+    def _get_active_state(self) -> dict[str, str | None]:
+        table = self.active_table or next(iter(self.data_sources))
+        if table not in self._table_states:
+            self._table_states[table] = {"sql": None, "title": None, "error": None}
+        return self._table_states[table]
+
+    @property
+    def sql(self) -> str | None:
+        return self._get_active_state()["sql"]
+
+    @sql.setter
+    def sql(self, value: str | None) -> None:
+        self._get_active_state()["sql"] = value
+
+    @property
+    def title(self) -> str | None:
+        return self._get_active_state()["title"]
+
+    @title.setter
+    def title(self, value: str | None) -> None:
+        self._get_active_state()["title"] = value
+
+    @property
+    def error(self) -> str | None:
+        return self._get_active_state()["error"]
+
+    @error.setter
+    def error(self, value: str | None) -> None:
+        self._get_active_state()["error"] = value
+
+    def update_dashboard(self, data: UpdateDashboardData) -> None:
+        table_name = data["table"]
+        self.active_table = table_name
+        if table_name not in self._table_states:
+            self._table_states[table_name] = {"sql": None, "title": None, "error": None}
+        self._table_states[table_name]["sql"] = data["query"]
+        self._table_states[table_name]["title"] = data["title"]
+        self._table_states[table_name]["error"] = None
+
+    def reset_dashboard(self, table: str | None = None) -> None:
+        if table is not None:
+            self.active_table = table
         self.sql = None
         self.title = None
         self.error = None
 
+    def get_active_data_source(self) -> DataSource:
+        """Return the current full-data source for the active table."""
+        if self.active_table is not None and self.active_table in self.data_sources:
+            return self.data_sources[self.active_table]
+        return next(iter(self.data_sources.values()))
+
     def get_current_data(self) -> IntoFrame:
         """Get current data, falling back to default if query fails."""
+        data_source = self.get_active_data_source()
         if self.sql:
             try:
-                result = self.data_source.execute_query(self.sql)
+                query_runner = self.query_executor or data_source
+                result = query_runner.execute_query(self.sql)
                 self.error = None  # Clear error on success
                 return result
             except Exception as e:
                 self.error = format_query_error(e)
                 self.sql = None
                 self.title = None
-                return self.data_source.get_data()
-        self.error = None
-        return self.data_source.get_data()
+                return data_source.get_data()
+        return data_source.get_data()
 
     def get_display_sql(self) -> str:
-        return self.sql or f"SELECT * FROM {self.data_source.table_name}"
+        table_name = self.active_table or next(iter(self.data_sources))
+        return self.sql or f"SELECT * FROM {table_name}"
 
     def get_display_messages(self) -> list[DisplayMessage]:
         """
@@ -280,9 +274,14 @@ def initialize_greeting_if_preset(self) -> bool:
     def to_dict(self) -> AppStateDict:
         """Serialize state to dict for framework state stores."""
         return {
+            "table": self.active_table,
             "sql": self.sql,
             "title": self.title,
             "error": self.error,
+            "table_states": {
+                name: {"sql": ts["sql"], "title": ts["title"], "error": ts["error"]}
+                for name, ts in self._table_states.items()
+            },
             "turns": [turn.model_dump() for turn in self.client.get_turns()],
         }
 
@@ -290,9 +289,22 @@ def update_from_dict(self, data: AppStateDict) -> None:
         """Restore state from serialized dict."""
         from chatlas import Turn
 
-        self.sql = data["sql"]
-        self.title = data["title"]
-        self.error = data["error"]
+        self.active_table = data.get("table", next(iter(self.data_sources)))
+
+        per_table = data.get("table_states")
+        if per_table:
+            for name, ts in per_table.items():
+                if name in self._table_states:
+                    self._table_states[name]["sql"] = ts.get("sql")
+                    self._table_states[name]["title"] = ts.get("title")
+                    self._table_states[name]["error"] = ts.get("error")
+        else:
+            # Backward compat: restore single active-table state from flat fields.
+            active = self.active_table or next(iter(self.data_sources))
+            if active in self._table_states:
+                self._table_states[active]["sql"] = data["sql"]
+                self._table_states[active]["title"] = data["title"]
+                self._table_states[active]["error"] = data["error"]
 
         turns_data = data["turns"]
         turns = [Turn.model_validate(t) for t in turns_data]
@@ -300,9 +312,11 @@ def update_from_dict(self, data: AppStateDict) -> None:
 
 
 def create_app_state(
-    data_source: DataSource,
+    *,
+    data_sources: dict[str, DataSource],
     client_factory: ClientFactory,
     greeting: Optional[str] = None,
+    query_executor: QueryExecutor | None = None,
 ) -> AppState:
     """Create AppState with callbacks connected via holder pattern."""
     state_holder: dict[str, AppState | None] = {"state": None}
@@ -313,16 +327,17 @@ def update_callback(data: UpdateDashboardData) -> None:
             raise RuntimeError("Callback invoked before state initialization")
         state.update_dashboard(data)
 
-    def reset_callback() -> None:
+    def reset_callback(_table: str) -> None:
         state = state_holder["state"]
         if state is None:
             raise RuntimeError("Callback invoked before state initialization")
-        state.reset_dashboard()
+        state.reset_dashboard(_table)
 
     client = client_factory(update_callback, reset_callback)
     state = AppState(
-        data_source=data_source,
+        data_sources=dict(data_sources),
         client=client,
+        query_executor=query_executor,
         greeting=greeting,
     )
     state_holder["state"] = state
diff --git a/pkg-py/src/querychat/_shiny.py b/pkg-py/src/querychat/_shiny.py
index 4bf0f2681..f616671fe 100644
--- a/pkg-py/src/querychat/_shiny.py
+++ b/pkg-py/src/querychat/_shiny.py
@@ -24,6 +24,9 @@
     import sqlalchemy
     from narwhals.stable.v1.typing import IntoFrame
 
+    from ._data_dict import DataDict
+    from ._table_accessor import TableAccessor
+
 
 class QueryChat(QueryChatBase[IntoFrameT]):
     """
@@ -112,13 +115,13 @@ class QueryChat(QueryChatBase[IntoFrameT]):
 
         The tools can be overridden per-client by passing a different `tools`
         parameter to the `.client()` method.
-    data_description
-        Description of the data in plain text or Markdown. If a pathlib.Path
-        object is passed, querychat will read the contents of the path into a
-        string with `.read_text()`.
-    categorical_threshold
-        Threshold for determining if a column is categorical based on number of
-        unique values.
+    data_dict
+        A :class:`~querychat.DataDict` instance, or a path (``str`` or
+        ``pathlib.Path``) to a YAML file, that provides rich per-table and
+        per-column metadata. When set, documented columns use the dict's
+        ``values``, ``range``, and ``description`` fields instead of querying
+        the data source for statistics, which speeds up schema generation and
+        improves LLM context. Supersedes ``data_description``.
     extra_instructions
         Additional instructions for the chat model. If a pathlib.Path object is
         passed, querychat will read the contents of the path into a string with
@@ -133,23 +136,30 @@ class QueryChat(QueryChatBase[IntoFrameT]):
           `data_source.get_schema()`
         - `{{data_description}}`: The optional data description provided
         - `{{extra_instructions}}`: Any additional instructions provided
+    categorical_threshold
+        Threshold for determining if a column is categorical based on number of
+        unique values.
+    data_description
+        Optional plain-text or Markdown description of the data, as a string or
+        file path. Superseded by ``data_dict`` for new code.
 
     """
 
     @overload
     def __init__(
         self: QueryChat[Any],
-        data_source: None,
-        table_name: str,
+        data_source: None = None,
+        table_name: str | None = None,
         *,
         id: Optional[str] = None,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -162,10 +172,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -178,10 +189,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -194,10 +206,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -210,25 +223,27 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None,
-        table_name: str,
+        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None = None,
+        table_name: str | None = None,
         *,
         id: Optional[str] = None,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ):
         super().__init__(
             data_source,
@@ -237,12 +252,12 @@ def __init__(
             client=client,
             tools=tools,
             data_description=data_description,
+            data_dict=data_dict,
             categorical_threshold=categorical_threshold,
             extra_instructions=extra_instructions,
             prompt_template=prompt_template,
         )
-        # Use table_name for ID since data_source might be None
-        self.id = id or f"querychat_{table_name}"
+        self.id = id or (f"querychat_{table_name}" if table_name else "querychat")
 
     def app(
         self, *, bookmark_store: Literal["url", "server", "disable"] = "url"
@@ -267,9 +282,9 @@ def app(
             A Shiny App object that can be run with `app.run()` or served with `shiny run`.
 
         """
-        data_source = self._require_data_source("app")
+        self._require_initialized("app")
         enable_bookmarking = bookmark_store != "disable"
-        table_name = data_source.table_name
+        first_table_name = next(iter(self._data_sources))
 
         def app_ui(request):
             return ui.page_sidebar(
@@ -291,33 +306,47 @@ def app_ui(request):
                     style="max-height: 33%;",
                 ),
                 ui.card(
-                    ui.card_header(bs_icon("table"), " Data"),
+                    ui.card_header(
+                        bs_icon("table"),
+                        " Data — ",
+                        ui.output_text("data_card_header_text", inline=True),
+                    ),
                     ui.output_data_frame("dt"),
                 ),
-                title=ui.span("querychat with ", ui.code(table_name)),
+                title=ui.span("querychat with ", ui.code(first_table_name)),
                 class_="bslib-page-dashboard",
                 fillable=True,
             )
 
         def app_server(input: Inputs, output: Outputs, session: Session):
+            self._mark_server_initialized()
             if enable_bookmarking:
                 session.bookmark.exclude.append("reset_query")
             vals = mod_server(
                 self.id,
-                data_source=data_source,
+                data_sources=dict(self._data_sources),
+                executor=self._require_query_executor("server"),
                 greeting=self.greeting,
                 client=self._create_session_client,
                 enable_bookmarking=enable_bookmarking,
                 tools=self.tools,
             )
 
+            @reactive.calc
+            def active_table_name() -> str:
+                return vals.current_table() or first_table_name
+
+            @render.text
+            def data_card_header_text():
+                return active_table_name()
+
             @render.text
             def query_title():
-                return vals.title() or "SQL Query"
+                return vals.table(active_table_name()).title() or "SQL Query"
 
             @render.ui
             def ui_reset():
-                req(vals.sql())
+                req(vals.table(active_table_name()).sql())
                 return ui.input_action_button(
                     "reset_query",
                     "Reset Query",
@@ -327,17 +356,20 @@ def ui_reset():
             @reactive.effect
             @reactive.event(input.reset_query)
             def _():
-                vals.sql.set(None)
-                vals.title.set(None)
+                name = active_table_name()
+                # TableAccessor is read-only; mutation requires direct TableState access
+                vals._tables[name].sql.set(None)
+                vals._tables[name].title.set(None)
 
             @render.data_frame
             def dt():
                 # Collect lazy sources (LazyFrame, Ibis Table) to eager DataFrame
-                return as_narwhals(vals.df())
+                return as_narwhals(vals.table(active_table_name()).df())
 
             @render.ui
             def sql_output():
-                sql_value = vals.sql() or f"SELECT * FROM {table_name}"
+                name = active_table_name()
+                sql_value = vals.table(name).sql() or f"SELECT * FROM {name}"
                 sql_code = f"```sql\n{sql_value}\n```"
                 return output_markdown_stream(
                     "sql_code",
@@ -412,7 +444,6 @@ def ui(self, *, id: Optional[str] = None, **kwargs):
     def server(
         self,
         *,
-        data_source: Optional[IntoFrame | sqlalchemy.Engine | ibis.Table] = None,
         client: str | chatlas.Chat | MISSING_TYPE = MISSING,
         enable_bookmarking: bool = False,
         id: Optional[str] = None,
@@ -427,10 +458,6 @@ def server(
 
         Parameters
         ----------
-        data_source
-            Optional data source to use. If provided, sets the data_source property
-            before initializing server logic. This is useful for the deferred pattern
-            where data_source is not known at initialization time.
         client
             Optional chat client to use for this session. If provided, overrides
             any client set at initialization time for this call only. This is useful
@@ -497,10 +524,7 @@ def title():
                 ".server() must be called within an active Shiny session (i.e., within the server function). "
             )
 
-        if data_source is not None:
-            self.data_source = data_source
-
-        resolved_data_source = self._require_data_source("server")
+        self._require_initialized("server")
         resolved_client_spec = self._client_spec if isinstance(client, MISSING_TYPE) else client
 
         def create_session_client(**kwargs) -> chatlas.Chat:
@@ -508,9 +532,11 @@ def create_session_client(**kwargs) -> chatlas.Chat:
                 client_spec=resolved_client_spec, **kwargs
             )
 
+        self._mark_server_initialized()
         return mod_server(
             id or self.id,
-            data_source=resolved_data_source,
+            data_sources=dict(self._data_sources),
+            executor=self._require_query_executor("server"),
             greeting=self.greeting,
             client=create_session_client,
             enable_bookmarking=enable_bookmarking,
@@ -589,13 +615,13 @@ def data_table():
         If `client` is not provided, querychat consults the
         `QUERYCHAT_CLIENT` environment variable. If that is not set, it
         defaults to `"openai"`.
-    data_description
-        Description of the data in plain text or Markdown. If a pathlib.Path
-        object is passed, querychat will read the contents of the path into a
-        string with `.read_text()`.
-    categorical_threshold
-        Threshold for determining if a column is categorical based on number of
-        unique values.
+    data_dict
+        A :class:`~querychat.DataDict` instance, or a path (``str`` or
+        ``pathlib.Path``) to a YAML file, that provides rich per-table and
+        per-column metadata. When set, documented columns use the dict's
+        ``values``, ``range``, and ``description`` fields instead of querying
+        the data source for statistics, which speeds up schema generation and
+        improves LLM context. Supersedes ``data_description``.
     extra_instructions
         Additional instructions for the chat model. If a pathlib.Path object is
         passed, querychat will read the contents of the path into a string with
@@ -610,6 +636,12 @@ def data_table():
           `data_source.get_schema()`
         - `{{data_description}}`: The optional data description provided
         - `{{extra_instructions}}`: Any additional instructions provided
+    categorical_threshold
+        Threshold for determining if a column is categorical based on number of
+        unique values.
+    data_description
+        Optional plain-text or Markdown description of the data, as a string or
+        file path. Superseded by ``data_dict`` for new code.
 
     """
 
@@ -619,17 +651,18 @@ def data_table():
     @overload
     def __init__(
         self: QueryChatExpress[Any],
-        data_source: None,
-        table_name: str,
+        data_source: None = None,
+        table_name: str | None = None,
         *,
         id: Optional[str] = None,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ) -> None: ...
 
@@ -643,10 +676,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ) -> None: ...
 
@@ -660,10 +694,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ) -> None: ...
 
@@ -677,10 +712,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ) -> None: ...
 
@@ -694,26 +730,28 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ) -> None: ...
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None,
-        table_name: str,
+        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None = None,
+        table_name: str | None = None,
         *,
         id: Optional[str] = None,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = DEFAULT_TOOLS,
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
         enable_bookmarking: Literal["auto", True, False] = "auto",
     ):
         # Sanity check: Express should always have a (stub/real) session
@@ -731,11 +769,12 @@ def __init__(
             client=client,
             tools=tools,
             data_description=data_description,
+            data_dict=data_dict,
             categorical_threshold=categorical_threshold,
             extra_instructions=extra_instructions,
             prompt_template=prompt_template,
         )
-        self.id = id or f"querychat_{table_name}"
+        self.id = id or (f"querychat_{table_name}" if table_name else "querychat")
 
         # Determine bookmarking setting
         # During stub session: detect from app_opts and cache in class variable
@@ -753,12 +792,34 @@ def __init__(
         else:
             enable = enable_bookmarking
 
+        self._enable_bookmarking = enable
+        self._vals: ServerValues[IntoFrameT] | None = None
+
+    def _ensure_server_started(self) -> None:
+        """
+        Start the Shiny module server if not already started.
+
+        Called lazily from ui()/sidebar() and the reactive accessors so that
+        module-level add_table() calls (which happen after __init__ but before
+        sidebar()/ui()) can complete before server initialization locks the
+        table set.
+        """
+        if self._server_initialized:
+            return
+        session = get_current_session()
+        if isinstance(session, ExpressStubSession):
+            return
+        if not self._data_sources:
+            return
+        self._require_initialized("_ensure_server_started")
+        self._mark_server_initialized()
         self._vals = mod_server(
             self.id,
-            data_source=self._data_source,
+            data_sources=dict(self._data_sources),
+            executor=self._require_query_executor("_ensure_server_started"),
             greeting=self.greeting,
             client=self._create_session_client,
-            enable_bookmarking=enable,
+            enable_bookmarking=self._enable_bookmarking,
             tools=self.tools,
         )
 
@@ -821,7 +882,18 @@ def ui(self, *, id: Optional[str] = None, **kwargs):
             A UI component.
 
         """
-        return mod_ui(id or self.id, preload_viz=has_viz_tool(self.tools), greeting=self.greeting, **kwargs)
+        result = mod_ui(id or self.id, preload_viz=has_viz_tool(self.tools), greeting=self.greeting, **kwargs)
+        self._ensure_server_started()
+        return result
+
+    def _require_vals(self) -> ServerValues[IntoFrameT]:  # live per-session values, or raise
+        self._ensure_server_started()  # lazy start; returns early if already started
+        if self._vals is None:  # start was skipped (stub session or no tables registered)
+            raise RuntimeError(
+                "QueryChat server is not initialized. "
+                "Ensure add_table() is called and sidebar()/ui() has been rendered."
+            )
+        return self._vals
 
     def df(self) -> IntoFrameT:
         """
@@ -836,7 +908,7 @@ def df(self) -> IntoFrameT:
             data source.
 
         """
-        return self._vals.df()
+        return self._require_vals().df()
 
     @overload
     def sql(self, query: None = None) -> str | None: ...
@@ -863,9 +935,9 @@ def sql(self, query: Optional[str] = None) -> str | None | bool:
 
         """
         if query is None:
-            return self._vals.sql()
+            return self._require_vals().sql()
         else:
-            return self._vals.sql.set(query)
+            return self._require_vals().sql.set(query)
 
     @overload
     def title(self, value: None = None) -> str | None: ...
@@ -897,6 +969,58 @@ def title(self, value: Optional[str] = None) -> str | None | bool:
 
         """
         if value is None:
-            return self._vals.title()
+            return self._require_vals().title()
         else:
-            return self._vals.title.set(value)
+            return self._require_vals().title.set(value)
+
+    def table(self, name: str) -> TableAccessor:
+        """
+        Get a per-table accessor with reactive state.
+
+        Parameters
+        ----------
+        name
+            Table name (must match a name passed to ``add_table()``).
+
+        Returns
+        -------
+        TableAccessor
+            Accessor with ``df()``, ``sql()``, and ``title()`` backed by
+            per-session reactive state.
+
+        Examples
+        --------
+        ```python
+        from querychat.express import QueryChat
+        from shiny.express import render
+
+        qc = QueryChat(orders, "orders")
+        qc.add_table(customers, "customers")
+        qc.sidebar()
+
+        @render.data_frame
+        def orders_table():
+            return qc.table("orders").df()
+
+        @render.data_frame
+        def customers_table():
+            return qc.table("customers").df()
+        ```
+
+        """
+        return self._require_vals().table(name)
+
+    def current_table(self) -> str | None:
+        """
+        Reactively read the name of the most recently queried table.
+
+        Returns ``None`` if no query has run yet in this session. Useful for
+        auto-switching a tabbed UI to the active table.
+
+        Returns
+        -------
+        str or None
+            Table name, or ``None``.
+
+        """
+        return self._require_vals().current_table()
diff --git a/pkg-py/src/querychat/_shiny_module.py b/pkg-py/src/querychat/_shiny_module.py
index 95d4882e6..f0b3e8d4d 100644
--- a/pkg-py/src/querychat/_shiny_module.py
+++ b/pkg-py/src/querychat/_shiny_module.py
@@ -12,7 +12,8 @@
 
 from shiny import module, reactive, ui
 
-from ._querychat_core import GREETING_PROMPT
+from ._querychat_core import GREETING_PROMPT, warn_multi_table_flat_accessor
+from ._table_accessor import TableAccessor
 from ._viz_altair_widget import AltairWidget
 from ._viz_ggsql import execute_ggsql
 from ._viz_utils import has_viz_tool, preload_viz_deps_server, preload_viz_deps_ui
@@ -25,6 +26,7 @@
     from shiny import Inputs, Outputs, Session
 
     from ._datasource import DataSource
+    from ._query_executor import QueryExecutor
     from ._viz_tools import VisualizeData
     from .types import UpdateDashboardData
 
@@ -56,6 +58,16 @@ def __getattr__(self, _name: str):
 ServerClient = chatlas.Chat | _DeferredStubChatClient
 
 
+@dataclass
+class TableState(Generic[IntoFrameT]):
+    """Per-table reactive state: the active SQL query, its title, and the resulting data."""
+
+    sql: ReactiveStringOrNone  # current SQL query for this table; None means no query is set
+    title: ReactiveStringOrNone  # title stored alongside the query; None when unset
+    df: Callable[[], IntoFrameT]  # zero-arg callable: query result if sql is set, else the source data
+
+
+
 @module.ui
 def mod_ui(*, preload_viz: bool = False, greeting: str | None = None, **kwargs):
     css_path = Path(__file__).parent / "static" / "css" / "styles.css"
@@ -80,43 +92,115 @@ def mod_ui(*, preload_viz: bool = False, greeting: str | None = None, **kwargs):
     )
 
 
-@dataclass
+class _MultiTableWarnReactive:
+    """Proxy over the primary table's reactive value; warns once per instance on first read."""
+
+    def __init__(
+        self,
+        primary: ReactiveStringOrNone,
+        accessor_name: str,
+        primary_table: str,
+        table_list: str,
+    ) -> None:
+        self._primary = primary  # wrapped reactive value that reads and writes delegate to
+        self._accessor_name = accessor_name  # flat accessor name forwarded to the warning
+        self._primary_table = primary_table
+        self._table_list = table_list
+        self._warned = False  # flipped on the first read so the warning fires only once
+
+    def _warn(self) -> None:
+        if not self._warned:
+            self._warned = True
+            warn_multi_table_flat_accessor(
+                self._accessor_name, self._primary_table, self._table_list, stacklevel=4
+            )
+
+    def __call__(self) -> str | None:
+        self._warn()
+        return self._primary.get()
+
+    def get(self) -> str | None:
+        self._warn()
+        return self._primary.get()
+
+    def set(self, value: str | None) -> bool:  # writes do not warn
+        return self._primary.set(value)  # propagate the result so callers returning .set() still get it
+
+
 class ServerValues(Generic[IntoFrameT]):
     """
     Session-specific reactive values and client returned by QueryChat.server().
 
-    This dataclass contains all the session-specific reactive state for a QueryChat
-    instance. Each session gets its own ServerValues to ensure proper isolation
+    Each session gets its own ServerValues to ensure proper isolation
     between concurrent sessions.
 
     Attributes
     ----------
     df
-        A reactive Calc that returns the current filtered data frame or lazy frame.
-        If the data source is lazy, returns a LazyFrame. If no SQL query has been
-        set, this returns the unfiltered data from the data source.
-        Call it like `.df()` to reactively read the current data.
+        Reactive Calc returning the current filtered data frame.
+        With multiple tables, warns and defaults to the primary table; use ``.table('name').df()``.
     sql
-        A reactive Value containing the current SQL query string. Access the value
-        by calling `.sql()`, or set it with `.sql.set("SELECT ...")`.
-        Returns `None` if no query has been set.
+        Reactive Value for the current SQL query string.
+        With multiple tables, warns and defaults to the primary table; use ``.table('name').sql``.
     title
-        A reactive Value containing the current title for the query. The LLM
-        provides this title when generating a new SQL query. Access it with
-        `.title()`, or set it with `.title.set("...")`. Returns
-        `None` if no title has been set.
+        Reactive Value for the current title.
+        With multiple tables, warns and defaults to the primary table; use ``.table('name').title``.
+    _tables
+        Per-table reactive state dict keyed by table name (the ``tables`` constructor argument); see ``.table(name)``.
     client
-        Session chat client value.
-        For real sessions this is a `chatlas.Chat` created by the client
-        factory. For deferred stub sessions (where `data_source` is not set
-        yet), this is a placeholder client that raises when accessed.
+        Session chat client.
+    current_table
+        The name of the most recently queried table, or ``None`` if no query
+        has been run yet. Call ``.current_table()`` to read reactively.
 
     """
 
-    df: Callable[[], IntoFrameT]
-    sql: ReactiveStringOrNone
-    title: ReactiveStringOrNone
-    client: ServerClient
+    def __init__(
+        self,
+        *,
+        df: Callable[[], IntoFrameT],
+        sql: ReactiveStringOrNone,
+        title: ReactiveStringOrNone,
+        tables: dict[str, TableState[IntoFrameT]],
+        client: ServerClient,
+        data_sources: dict[str, DataSource[IntoFrameT]],
+        current_table: ReactiveStringOrNone,
+    ):
+        self.df = df
+        self.sql = sql
+        self.title = title
+        self._tables = tables  # backs table() and table_names()
+        self.client = client
+        self._data_sources = data_sources
+        self._current_table_rv = current_table  # read through the current_table() method
+
+    def table(self, name: str) -> TableAccessor:
+        """
+        Get a per-table accessor with reactive state.
+
+        Parameters
+        ----------
+        name
+            Table name.
+
+        Returns
+        -------
+        TableAccessor
+            Accessor with df(), sql(), title() backed by per-session state.
+
+        """
+        if name not in self._tables:
+            available = ", ".join(f"'{n}'" for n in self._tables)
+            raise ValueError(f"Table '{name}' not found. Available: {available}")
+        return TableAccessor(name, self._data_sources[name], state=self._tables[name])
+
+    def table_names(self) -> list[str]:
+        """Return the names of all registered tables."""
+        return list(self._tables.keys())
+
+    def current_table(self) -> str | None:
+        """Return the name of the most recently queried table, or None (reactive)."""
+        return self._current_table_rv.get()
 
 
 @module.server
@@ -125,15 +209,13 @@ def mod_server(
     output: Outputs,
     session: Session,
     *,
-    data_source: DataSource[IntoFrameT] | None,
+    data_sources: dict[str, DataSource[IntoFrameT]] | None,
+    executor: QueryExecutor | None,
     greeting: str | None,
     client: Callable[..., chatlas.Chat],
     enable_bookmarking: bool,
     tools: set[str] | None = None,
 ) -> ServerValues[IntoFrameT]:
-    # Reactive values to store state
-    sql = ReactiveStringOrNone(None)
-    title = ReactiveStringOrNone(None)
     # Holds a generated greeting so it can be saved and restored on bookmark.
     # Static greetings live in the UI (chat_ui(greeting=)) and persist already.
     # Workaround for posit-dev/shinychat#253: shinychat does not bookmark
@@ -145,13 +227,36 @@ def mod_server(
     if not callable(client):
         raise TypeError("mod_server() requires a callable client factory.")
 
-    def update_dashboard(data: UpdateDashboardData):
-        sql.set(data["query"])
-        title.set(data["title"])
+    table_states: dict[str, TableState[IntoFrameT]] = {}
+    _current_table: ReactiveStringOrNone = ReactiveStringOrNone(None)
+
+    def _make_table_state(
+        source: DataSource[IntoFrameT], exec: QueryExecutor
+    ) -> TableState[IntoFrameT]:
+        table_sql = ReactiveStringOrNone(None)
+        table_title = ReactiveStringOrNone(None)
+
+        @reactive.calc
+        def filtered_df() -> IntoFrameT:
+            query = table_sql.get()
+            if query:
+                return exec.execute_query(query)
+            return source.get_data()
 
-    def reset_dashboard():
-        sql.set(None)
-        title.set(None)
+        return TableState(sql=table_sql, title=table_title, df=filtered_df)
+
+    def update_dashboard(data: UpdateDashboardData):
+        table_name = data["table"]
+        if table_name in table_states:
+            table_states[table_name].sql.set(data["query"])
+            table_states[table_name].title.set(data["title"])
+            _current_table.set(table_name)
+
+    def reset_dashboard(table_name: str):
+        if table_name in table_states:
+            table_states[table_name].sql.set(None)
+            table_states[table_name].title.set(None)
+            _current_table.set(table_name)
 
     viz_widgets: list[VizWidgetEntry] = []
 
@@ -167,43 +272,42 @@ def build_chat_client() -> chatlas.Chat:
         )
 
     # Short-circuit for stub sessions (e.g. 1st run of an Express app)
-    # data_source may be None during stub session for deferred pattern
+    # data_sources may be None during stub session for deferred pattern
     if session.is_stub_session():
         # Mock the error that would otherwise occur in a real session
         def _stub_df():
             raise RuntimeError("RuntimeError: No current reactive context")
 
         stub_client = (
-            _DeferredStubChatClient() if data_source is None else build_chat_client()
+            _DeferredStubChatClient() if data_sources is None else build_chat_client()
         )
 
         return ServerValues(
             df=_stub_df,
-            sql=sql,
-            title=title,
+            sql=ReactiveStringOrNone(None),
+            title=ReactiveStringOrNone(None),
+            tables={},
             client=stub_client,
+            data_sources=data_sources or {},
+            current_table=ReactiveStringOrNone(None),
         )
 
-    # Real session requires data_source
-    if data_source is None:
+    # Real session requires data_sources and executor
+    if data_sources is None or executor is None:
         raise RuntimeError(
-            "data_source must be set before the real session. "
-            "Set it via the data_source property before users connect."
+            "At least one table must be registered before the session starts. "
+            "Call add_table() before server(), or pass the data to the QueryChat constructor."
         )
 
+    for name, source in data_sources.items():
+        table_states[name] = _make_table_state(source, executor)
+
     # Build the session-specific chat client through QueryChat.client(...).
     chat = build_chat_client()
 
     if has_viz_tool(tools):
         preload_viz_deps_server()
 
-    # Execute query when SQL changes
-    @reactive.calc
-    def filtered_df():
-        query = sql.get()
-        df = data_source.get_data() if not query else data_source.execute_query(query)
-        return df
-
     # Chat UI logic
     chat_ui = shinychat.Chat(CHAT_ID)
     ctrl = chatlas.StreamController()
@@ -258,17 +362,15 @@ async def _handle_greeting_requested():
     @reactive.event(input.chat_update)
     def _():
         update = input.chat_update()
-        if update is None:
-            return
-        if not isinstance(update, dict):
+        if update is None or not isinstance(update, dict):
             return
-
-        new_query = update.get("query")
-        new_title = update.get("title")
-        if new_query is not None:
-            sql.set(new_query)
-        if new_title is not None:
-            title.set(new_title)
+        table_name = update.get("table", "")
+        new_query = update.get("query") or None  # "" → None (reset)
+        new_title = update.get("title") or None
+        if table_name and table_name in table_states:
+            table_states[table_name].sql.set(new_query)
+            table_states[table_name].title.set(new_title)
+            _current_table.set(table_name)
 
     if enable_bookmarking:
         chat_ui.enable_bookmarking(chat)
@@ -277,8 +379,9 @@ def _():
         @session.bookmark.on_bookmark
         def _on_bookmark(x: BookmarkState) -> None:
             vals = x.values
-            vals["querychat_sql"] = sql.get()
-            vals["querychat_title"] = title.get()
+            for name, state in table_states.items():
+                vals[f"querychat_sql_{name}"] = state.sql.get()
+                vals[f"querychat_title_{name}"] = state.title.get()
             greeting_val = current_greeting.get()
             if greeting_val is not None:
                 vals["querychat_greeting"] = greeting_val
@@ -288,10 +391,16 @@ def _on_bookmark(x: BookmarkState) -> None:
         @session.bookmark.on_restore
         async def _on_restore(x: RestoreState) -> None:
             vals = x.values
-            if "querychat_sql" in vals:
-                sql.set(vals["querychat_sql"])
-            if "querychat_title" in vals:
-                title.set(vals["querychat_title"])
+            last_restored: str | None = None
+            for name, state in table_states.items():
+                if f"querychat_sql_{name}" in vals:
+                    state.sql.set(vals[f"querychat_sql_{name}"])
+                    if vals[f"querychat_sql_{name}"] is not None:
+                        last_restored = name
+                if f"querychat_title_{name}" in vals:
+                    state.title.set(vals[f"querychat_title_{name}"])
+            if last_restored is not None:
+                _current_table.set(last_restored)
             if "querychat_greeting" in vals:
                 current_greeting.set(vals["querychat_greeting"])
                 await chat_ui.set_greeting(
@@ -301,11 +410,45 @@ async def _on_restore(x: RestoreState) -> None:
                 )
             if "querychat_viz_widgets" in vals:
                 restored = restore_viz_widgets(
-                    data_source, vals["querychat_viz_widgets"]
+                    executor, vals["querychat_viz_widgets"]
                 )
                 viz_widgets[:] = restored
 
-    return ServerValues(df=filtered_df, sql=sql, title=title, client=chat)
+    if len(table_states) == 1:
+        only_state = next(iter(table_states.values()))
+        return ServerValues(
+            df=only_state.df,
+            sql=only_state.sql,
+            title=only_state.title,
+            tables=table_states,
+            client=chat,
+            data_sources=data_sources,
+            current_table=_current_table,
+        )
+
+    primary_name = next(iter(table_states))
+    primary_state = table_states[primary_name]
+    table_list = ", ".join(f"'{n}'" for n in table_states)
+
+    df_warned = False
+
+    @reactive.calc
+    def _multi_table_df() -> IntoFrameT:
+        nonlocal df_warned
+        if not df_warned:
+            df_warned = True
+            warn_multi_table_flat_accessor("df", primary_name, table_list)
+        return primary_state.df()
+
+    return ServerValues(
+        df=_multi_table_df,
+        sql=_MultiTableWarnReactive(primary_state.sql, "sql", primary_name, table_list),  # type: ignore[arg-type]
+        title=_MultiTableWarnReactive(primary_state.title, "title", primary_name, table_list),  # type: ignore[arg-type]
+        tables=table_states,
+        client=chat,
+        data_sources=data_sources,
+        current_table=_current_table,
+    )
 
 
 class GreetWarning(Warning):
@@ -313,7 +456,7 @@ class GreetWarning(Warning):
 
 
 def restore_viz_widgets(
-    data_source: DataSource[IntoFrameT],
+    executor: QueryExecutor,
     saved_widgets: list[VizWidgetEntry],
 ) -> list[VizWidgetEntry]:
     """Re-execute ggsql queries, register widgets, and return restored entries."""
@@ -327,7 +470,7 @@ def restore_viz_widgets(
         ggsql_str = entry["ggsql"]
         try:
             validated = validate(ggsql_str)
-            spec = execute_ggsql(data_source, validated)
+            spec = execute_ggsql(executor, validated)
             altair_widget = AltairWidget.from_ggsql(spec, widget_id=widget_id)
             register_widget(widget_id, altair_widget.widget)
             restored.append(entry)
diff --git a/pkg-py/src/querychat/_streamlit.py b/pkg-py/src/querychat/_streamlit.py
index b68a6effc..b8093b83f 100644
--- a/pkg-py/src/querychat/_streamlit.py
+++ b/pkg-py/src/querychat/_streamlit.py
@@ -13,6 +13,7 @@
     create_app_state,
     stream_response,
 )
+from ._table_accessor import TableAccessor
 from ._ui_assets import STREAMLIT_JS, SUGGESTION_CSS
 from ._utils import as_narwhals
 
@@ -25,6 +26,50 @@
     import sqlalchemy
     from narwhals.stable.v1.typing import IntoFrame
 
+    from ._data_dict import DataDict
+
+
+class StreamlitTableAccessor(TableAccessor):
+    """Per-table accessor for Streamlit QueryChat. Returned by ``qc.table(name)``."""
+
+    def __init__(self, querychat: QueryChat, table_name: str) -> None:
+        # Bypass TableAccessor.__init__ — this subclass owns df/sql/title entirely
+        # via session state, so _state is never used.
+        self._table_name = table_name
+        self._data_source = querychat._data_sources[table_name]
+        self._querychat_ref = querychat
+
+    def _table_state(self) -> Any:
+        """Return this table's session-state entry, or an empty dict if absent."""
+        return self._querychat_ref._get_state()._table_states.get(self._table_name, {})
+
+    def df(self) -> Any:
+        """
+        Get the current filtered data for this table.
+
+        Returns the full dataset when no SQL filter is active. If the stored
+        filter fails to execute, a ``RuntimeWarning`` is emitted and the full
+        dataset is returned instead.
+        """
+        import warnings
+
+        sql = self._table_state().get("sql")
+        if sql:
+            try:
+                executor = self._querychat_ref._require_query_executor("table.df")
+                return executor.execute_query(sql)
+            except Exception as exc:  # best-effort: fall back to unfiltered data
+                warnings.warn(f"Filter SQL for table '{self._table_name}' failed ({exc}); returning unfiltered data.", RuntimeWarning, stacklevel=2)
+        return self._querychat_ref._data_sources[self._table_name].get_data()
+
+    def sql(self) -> str | None:
+        """Return the current SQL filter for this table, or None."""
+        return self._table_state().get("sql")
+
+    def title(self) -> str | None:
+        """Return the current filter title for this table, or None."""
+        return self._table_state().get("title")
+
 
 class QueryChat(QueryChatBase[IntoFrameT]):
     """
@@ -61,16 +106,17 @@ class QueryChat(QueryChatBase[IntoFrameT]):
     @overload
     def __init__(
         self: QueryChat[Any],
-        data_source: None,
-        table_name: str,
+        data_source: None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -82,10 +128,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -97,10 +144,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -112,10 +160,11 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     @overload
@@ -127,24 +176,26 @@ def __init__(
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ) -> None: ...
 
     def __init__(
         self,
-        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None,
-        table_name: str,
+        data_source: IntoFrame | sqlalchemy.Engine | ibis.Table | None = None,
+        table_name: str | None = None,
         *,
         greeting: Optional[str | Path] = None,
         client: Optional[str | chatlas.Chat] = None,
         tools: TOOL_GROUPS | tuple[TOOL_GROUPS, ...] | None = ("filter", "query"),
-        data_description: Optional[str | Path] = None,
-        categorical_threshold: int = 20,
+        data_dict: DataDict | str | Path | None = None,
         extra_instructions: Optional[str | Path] = None,
         prompt_template: Optional[str | Path] = None,
+        categorical_threshold: int = 20,
+        data_description: Optional[str | Path] = None,
     ):
         super().__init__(
             data_source,
@@ -153,25 +204,27 @@ def __init__(
             client=client,
             tools=tools,
             data_description=data_description,
+            data_dict=data_dict,
             categorical_threshold=categorical_threshold,
             extra_instructions=extra_instructions,
             prompt_template=prompt_template,
         )
-        self._state_key = f"_querychat_{table_name}"
+        self._state_key = f"_querychat_{table_name}" if table_name else "_querychat"
 
     def _get_state(self) -> AppState:
         """Get or create session state."""
-        data_source = self._require_data_source("_get_state")
+        self._require_initialized("_get_state")
         import streamlit as st
 
         if self._state_key not in st.session_state:
             st.session_state[self._state_key] = create_app_state(
-                data_source,
-                lambda update_cb, reset_cb: self.client(
+                data_sources=dict(self._data_sources),
+                client_factory=lambda update_cb, reset_cb: self.client(
                     update_dashboard=update_cb,
                     reset_dashboard=reset_cb,
                 ),
-                self.greeting,
+                greeting=self.greeting,
+                query_executor=self._require_query_executor("_get_state"),
             )
         return st.session_state[self._state_key]
 
@@ -182,11 +235,18 @@ def app(self) -> None:
         Configures the page, renders chat in sidebar, and displays
         SQL query and data table in the main area.
         """
-        data_source = self._require_data_source("app")
+        self._require_initialized("app")
+        if len(self._data_sources) > 1:
+            table_list = ", ".join(f"'{n}'" for n in self._data_sources)
+            raise RuntimeError(
+                f"app() does not support multiple tables ({table_list}). "
+                "Build a custom layout using sidebar(), ui(), and table('name') instead."
+            )
         import streamlit as st
 
+        table_name = next(iter(self._data_sources))
         st.set_page_config(
-            page_title=f"querychat with {data_source.table_name}",
+            page_title=f"querychat with {table_name}",
             layout="wide",
             initial_sidebar_state="expanded",
         )
@@ -270,16 +330,32 @@ def df(self) -> IntoFrameT:
         eager sources, a LazyFrame for Polars lazy sources, or an Ibis Table
         for Ibis sources. Callers needing an eager DataFrame should collect
         the result (e.g., via ``as_narwhals(qc.df())``).
+
+        Raises ``AttributeError`` when multiple tables are registered;
+        use ``qc.table('name').df()`` instead.
         """
+        self._require_single_table("df")
         # Cast is safe because get_current_data() returns the same type as the data source
         return cast("IntoFrameT", self._get_state().get_current_data())
 
     def sql(self) -> str | None:
-        """Get the current SQL query, or None if using default."""
+        """
+        Get the current SQL query, or None if using default.
+
+        Raises ``AttributeError`` when multiple tables are registered;
+        use ``qc.table('name').sql()`` instead.
+        """
+        self._require_single_table("sql")
         return self._get_state().sql
 
     def title(self) -> str | None:
-        """Get the current query title, or None if using default."""
+        """
+        Get the current query title, or None if using default.
+
+        Raises ``AttributeError`` when multiple tables are registered;
+        use ``qc.table('name').title()`` instead.
+        """
+        self._require_single_table("title")
         return self._get_state().title
 
     def reset(self) -> None:
@@ -305,12 +381,13 @@ def reset(self) -> None:
 
     def _render_main_content(self) -> None:
         """Render the main content area (SQL + data table)."""
-        data_source = self._require_data_source("_render_main_content")
+        self._require_initialized("_render_main_content")
         import streamlit as st
 
         state = self._get_state()
+        table_name = next(iter(self._data_sources))
 
-        st.title(f"querychat with `{data_source.table_name}`")
+        st.title(f"querychat with `{table_name}`")
 
         st.subheader(state.title or "SQL Query")
 
@@ -331,3 +408,24 @@ def _render_main_content(self) -> None:
             df.to_native(), use_container_width=True, height=400, hide_index=True
         )
         st.caption(f"Data has {df.shape[0]} rows and {df.shape[1]} columns.")
+
+    def table(self, name: str) -> StreamlitTableAccessor:
+        """
+        Look up a registered table and wrap it in a per-table accessor.
+
+        Parameters
+        ----------
+        name
+            Name of the table; must be one of ``qc.table_names()``.
+
+        Raises
+        ------
+        ValueError
+            If no table called ``name`` has been registered.
+
+        """
+        if name in self._data_sources:
+            return StreamlitTableAccessor(self, name)
+        raise ValueError(
+            f"Table '{name}' not found. Available tables: {self.table_names()}"
+        )
diff --git a/pkg-py/src/querychat/_system_prompt.py b/pkg-py/src/querychat/_system_prompt.py
index f690a0696..a7e17d6cc 100644
--- a/pkg-py/src/querychat/_system_prompt.py
+++ b/pkg-py/src/querychat/_system_prompt.py
@@ -1,16 +1,16 @@
 from __future__ import annotations
 
-import re
+import warnings
 from pathlib import Path
 from typing import TYPE_CHECKING
 
 import chevron
+import yaml
 
 from ._viz_utils import has_viz_tool
 
-_SCHEMA_TAG_RE = re.compile(r"\{\{[{#^/]?\s*schema\b")
-
 if TYPE_CHECKING:
+    from ._data_dict import DataDict
     from ._datasource import DataSource
 
 
@@ -19,47 +19,106 @@ class QueryChatSystemPrompt:
 
     def __init__(
         self,
-        prompt_template: str | Path,
-        data_source: DataSource,
+        *,
+        prompt_template: str | Path | None,
+        data_source: DataSource | None = None,
+        data_sources: dict[str, DataSource] | None = None,
         data_description: str | Path | None = None,
         extra_instructions: str | Path | None = None,
-        categorical_threshold: int = 10,
+        categorical_threshold: int = 20,
+        data_dicts: list[DataDict] | None = None,
     ):
-        """
-        Initialize with prompt components.
-
-        Args:
-            prompt_template: Mustache template string or path to template file
-            data_source: DataSource instance for schema generation
-            data_description: Optional data context (string or path)
-            extra_instructions: Optional custom LLM instructions (string or path)
-            categorical_threshold: Threshold for categorical column detection
-
-        """
-        if isinstance(prompt_template, Path):
-            self.template = prompt_template.read_text()
-        else:
-            self.template = prompt_template
-
-        if isinstance(data_description, Path):
-            self.data_description = data_description.read_text()
+        if data_sources is not None:
+            self._data_sources = data_sources
+        elif data_source is not None:
+            self._data_sources = {data_source.table_name: data_source}
         else:
-            self.data_description = data_description
+            raise ValueError("Either data_source or data_sources must be provided")
 
-        if isinstance(extra_instructions, Path):
-            self.extra_instructions = extra_instructions.read_text()
-        else:
-            self.extra_instructions = extra_instructions
+        self._data_dicts: list[DataDict] = data_dicts or []
 
-        if _SCHEMA_TAG_RE.search(self.template):
-            self.schema = data_source.get_schema(
-                categorical_threshold=categorical_threshold
+        if len(self._data_sources) > 1 and not self._data_dicts:
+            warnings.warn(
+                "Multiple tables registered without a data_dict. "
+                "Providing a data_dict with table descriptions and relationships "
+                "gives the LLM better context for multi-table queries.",
+                UserWarning,
+                stacklevel=3,
             )
-        else:
-            self.schema = ""
 
+        if prompt_template is None:
+            prompt_template = Path(__file__).parent / "prompts" / "prompt.md"
+        self.template = (
+            prompt_template.read_text()
+            if isinstance(prompt_template, Path)
+            else prompt_template
+        )
+
+        self.data_description = (
+            data_description.read_text()
+            if isinstance(data_description, Path)
+            else data_description
+        )
+        self.extra_instructions = (
+            extra_instructions.read_text()
+            if isinstance(extra_instructions, Path)
+            else extra_instructions
+        )
         self.categorical_threshold = categorical_threshold
-        self.data_source = data_source
+
+    def _generate_tables_overview(self) -> str:
+        """Build a Markdown bullet list naming each table, with its description if shown."""
+        bullets: list[str] = []
+        for table, src in self._data_sources.items():
+            summary = src.get_data_description() or None
+            # Per-table descriptions are dropped when a global data_description exists.
+            with_summary = bool(summary) and not self.data_description
+            bullets.append(f"- {table}: {summary}" if with_summary else f"- {table}")
+        return "\n".join(bullets)
+
+    def _generate_data_dicts_yaml(self) -> str:
+        """
+        Render each data dict as a ``<data-dict>`` block with a YAML body.
+
+        Tables not claimed by any data dict are listed in a trailing ``<tables>`` block.
+        """
+
+        def escape_attr(val: str) -> str:
+            return val.replace('"', "&quot;")
+
+        blocks: list[str] = []
+        all_claimed: set[str] = set()
+
+        for dd in self._data_dicts:
+            d = dd.to_prompt_dict()
+            # Name and description belong in the XML tag, not the YAML body
+            d.pop("name", None)
+            d.pop("description", None)
+
+            all_claimed.update(n for n in self._data_sources if n in dd.tables)
+            if "tables" in d:
+                d["tables"] = {n: v for n, v in d["tables"].items() if n in self._data_sources}
+                if not d["tables"]:
+                    del d["tables"]
+
+            # Join attributes with single spaces so a missing name or description
+            # never yields a stray leading/trailing space inside the tag.
+            pairs = (("name", dd.name), ("description", dd.description))
+            tag = " ".join(["data-dict", *(f'{k}="{escape_attr(v)}"' for k, v in pairs if v)])
+
+            body = yaml.dump(d, default_flow_style=False, allow_unicode=True, sort_keys=False).rstrip() if d else ""
+            blocks.append(f"<{tag}>\n{body}\n</data-dict>" if body else f"<{tag}/>")
+
+        unclaimed = [n for n in self._data_sources if n not in all_claimed]
+        if unclaimed:
+            tables: dict = {}
+            for name in unclaimed:
+                desc = (self._data_sources[name].get_data_description() or None) if not self.data_description else None
+                tables[name] = {"description": desc} if desc else None
+            yaml_str = yaml.dump({"tables": tables}, default_flow_style=False, allow_unicode=True, sort_keys=False).rstrip()
+            blocks.append(f"<tables>\n{yaml_str}\n</tables>")
+
+        return "\n\n".join(blocks)
 
     def render(self, tools: set[str] | None) -> str:
         """
@@ -72,20 +131,24 @@ def render(self, tools: set[str] | None) -> str:
             Fully rendered system prompt string
 
         """
-        db_type = self.data_source.get_db_type()
-        is_duck_db = db_type.lower() == "duckdb"
+        first_source = next(iter(self._data_sources.values()))
+        db_type = first_source.get_db_type()
+        has_dicts = bool(self._data_dicts)
 
         context = {
             "db_type": db_type,
-            "is_duck_db": is_duck_db,
-            "semantic_views": self.data_source.get_semantic_views_description(),
-            "schema": self.schema,
+            "is_duck_db": db_type.lower() == "duckdb",
+            "semantic_views": first_source.get_semantic_views_description(),
+            "has_data_dicts": has_dicts,
+            "data_dicts": self._generate_data_dicts_yaml() if has_dicts else "",
+            "tables_overview": "" if has_dicts else self._generate_tables_overview(),
             "data_description": self.data_description,
             "extra_instructions": self.extra_instructions,
             "has_tool_update": "update" in tools if tools else False,
             "has_tool_query": "query" in tools if tools else False,
             "has_tool_visualize": has_viz_tool(tools),
             "include_query_guidelines": len(tools or ()) > 0,
+            "multi_table": len(self._data_sources) > 1,
         }
 
         prompts_dir = str(Path(__file__).parent / "prompts")
@@ -95,3 +158,10 @@ def render(self, tools: set[str] | None) -> str:
             partials_path=prompts_dir,
             partials_ext="md",
         )
+
+    @property
+    def data_source(self) -> DataSource:
+        """Return the sole data source (backwards-compatible single-table accessor)."""
+        if len(self._data_sources) != 1:
+            raise ValueError("Multiple data sources present; use _data_sources instead")
+        return next(iter(self._data_sources.values()))
diff --git a/pkg-py/src/querychat/_table_accessor.py b/pkg-py/src/querychat/_table_accessor.py
new file mode 100644
index 000000000..f2dbb380e
--- /dev/null
+++ b/pkg-py/src/querychat/_table_accessor.py
@@ -0,0 +1,62 @@
+"""TableAccessor class for accessing per-table state and data."""
+
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Any
+
+if TYPE_CHECKING:
+    from ._datasource import DataSource
+
+
+class TableAccessor:
+    """
+    View over one table's data source and its per-table state.
+
+    Instances are handed out by ``qc_vals.table("name")`` inside Shiny server
+    callbacks and by ``qc.table("name")`` in Streamlit; ``df()``, ``sql()`` and
+    ``title()`` all delegate to the ``state`` object supplied at construction.
+
+    Parameters
+    ----------
+    table_name
+        Name of the table this accessor is bound to.
+    data_source
+        DataSource backing that table.
+    state
+        Per-table state object; must expose ``df()``, ``sql.get()`` and ``title.get()``.
+
+    """
+
+    def __init__(
+        self,
+        table_name: str,
+        data_source: DataSource,
+        *,
+        state: Any,
+    ) -> None:
+        # Plain attribute storage only; nothing is validated or copied here.
+        self._state = state
+        self._table_name, self._data_source = table_name, data_source
+
+    @property
+    def table_name(self) -> str:
+        """Name of the table this accessor was created for."""
+        return self._table_name
+
+    @property
+    def data_source(self) -> DataSource:
+        """DataSource object passed in at construction."""
+        return self._data_source
+
+    def df(self) -> Any:
+        """Current filtered data for this table, obtained from the state's ``df()``."""
+        return self._state.df()
+
+    def sql(self) -> str | None:
+        """Current SQL filter for this table, obtained from the state's ``sql.get()``."""
+        return self._state.sql.get()
+
+    def title(self) -> str | None:
+        """Current filter title for this table, obtained from the state's ``title.get()``."""
+        return self._state.title.get()
+
diff --git a/pkg-py/src/querychat/_viz_ggsql.py b/pkg-py/src/querychat/_viz_ggsql.py
index 076b4f3b3..9e166c151 100644
--- a/pkg-py/src/querychat/_viz_ggsql.py
+++ b/pkg-py/src/querychat/_viz_ggsql.py
@@ -10,20 +10,20 @@
 if TYPE_CHECKING:
     import ggsql
 
-    from ._datasource import DataSource
+    from ._query_executor import QueryExecutor
 
 
-def execute_ggsql(data_source: DataSource, validated: ggsql.Validated) -> ggsql.Spec:
+def execute_ggsql(executor: QueryExecutor, validated: ggsql.Validated) -> ggsql.Spec:
     """
-    Execute a pre-validated ggsql query against a DataSource, returning a Spec.
+    Execute a pre-validated ggsql query against a QueryExecutor, returning a Spec.
 
-    Executes the SQL portion through DataSource (preserving database pushdown),
+    Executes the SQL portion through the executor (preserving database pushdown),
     then feeds the result into a ggsql DuckDBReader to produce a Spec.
 
     Parameters
     ----------
-    data_source
-        The querychat DataSource to execute the SQL portion against.
+    executor
+        The querychat QueryExecutor to execute the SQL portion against.
     validated
         A pre-validated ggsql query (from ``ggsql.validate()``).
 
@@ -47,7 +47,7 @@ def execute_ggsql(data_source: DataSource, validated: ggsql.Validated) -> ggsql.
             "result."
         )
 
-    pl_df = to_polars(data_source.execute_query(validated.sql()))
+    pl_df = to_polars(executor.execute_query(validated.sql()))
 
     reader = DuckDBReader("duckdb://memory")
     table = extract_visualise_table(visual)
diff --git a/pkg-py/src/querychat/_viz_tools.py b/pkg-py/src/querychat/_viz_tools.py
index 19833eb77..c57b297c0 100644
--- a/pkg-py/src/querychat/_viz_tools.py
+++ b/pkg-py/src/querychat/_viz_tools.py
@@ -28,7 +28,7 @@
     import altair as alt
     from ipywidgets.widgets.widget import Widget
 
-    from ._datasource import DataSource
+    from ._query_executor import QueryExecutor
 
 
 class VisualizeData(TypedDict):
@@ -56,18 +56,22 @@ class VisualizeData(TypedDict):
 
 
 def tool_visualize(
-    data_source: DataSource,
+    executor: QueryExecutor,
     update_fn: Callable[[VisualizeData], None],
+    *,
+    multi_table: bool = False,
 ) -> Tool:
     """
     Create a tool that executes a ggsql query and renders the visualization.
 
     Parameters
     ----------
-    data_source
-        The data source to query against
+    executor
+        The query executor to query against
     update_fn
         Callback function to call with VisualizeData when visualization succeeds
+    multi_table
+        Whether multiple tables are registered.
 
     Returns
     -------
@@ -75,10 +79,11 @@ def tool_visualize(
         A tool that can be registered with chatlas
 
     """
-    impl = visualize_impl(data_source, update_fn)
+    impl = visualize_impl(executor, update_fn)
     impl.__doc__ = read_prompt_template(
         "tool-visualize.md",
-        db_type=data_source.get_db_type(),
+        db_type=executor.get_db_type(),
+        multi_table=multi_table,
     )
 
     return Tool.from_func(
@@ -147,7 +152,7 @@ def __init__(
 
 
 def visualize_impl(
-    data_source: DataSource,
+    executor: QueryExecutor,
     update_fn: Callable[[VisualizeData], None],
 ) -> Callable[[str, str], ContentToolResult]:
     """Create the visualize implementation function."""
@@ -173,7 +178,7 @@ def visualize(
                     "\n".join(error["message"] for error in validated.errors())
                 )
 
-            spec = execute_ggsql(data_source, validated)
+            spec = execute_ggsql(executor, validated)
 
             raw_chart = VegaLiteWriter().render_chart(spec)
             altair_widget = AltairWidget(copy.deepcopy(raw_chart))
diff --git a/pkg-py/src/querychat/prompts/prompt.md b/pkg-py/src/querychat/prompts/prompt.md
index 00272cada..08b0c93f7 100644
--- a/pkg-py/src/querychat/prompts/prompt.md
+++ b/pkg-py/src/querychat/prompts/prompt.md
@@ -1,20 +1,26 @@
 You are a data dashboard chatbot that operates in a sidebar interface. Your role is to help users interact with their data through filtering, sorting, and answering questions.{{#has_tool_visualize}} You can also help them explore data visually.{{/has_tool_visualize}}
 
-You have access to a {{db_type}} SQL database with the following schema:
+You have access to a {{db_type}} SQL database with the following tables:
 
-<database_schema>
-{{schema}}
-</database_schema>
+{{#has_data_dicts}}
+{{{data_dicts}}}
 
-{{#data_description}}
-Here is additional information about the data:
+{{/has_data_dicts}}
+{{^has_data_dicts}}
+<tables>
+{{{tables_overview}}}
+</tables>
 
+{{/has_data_dicts}}
+{{#data_description}}
 <data_description>
 {{data_description}}
 </data_description>
+
 {{/data_description}}
+Always call `querychat_get_schema` before writing SQL against any table you haven't retrieved schema for in this conversation. Do not infer column names from table names, variable names, or the system prompt alone — verify the actual schema first, then write the query.
 
-For security reasons, you may only query this specific table.
+For security reasons, you may only query {{#multi_table}}these specific tables{{/multi_table}}{{^multi_table}}this specific table{{/multi_table}}.
 
 {{#include_query_guidelines}}
 ## SQL Query Guidelines
@@ -82,18 +88,19 @@ You can handle these types of requests:
 When the user asks you to filter or sort the dashboard, e.g. "Show me..." or "Which ____ have the highest ____?" or "Filter to only include ____":
 
 - Write a {{db_type}} SQL SELECT query
-- Call `querychat_update_dashboard` with the query and a descriptive title
-- The query MUST return all columns from the schema (you can use `SELECT *`)
+- Call `querychat_update_dashboard` with the query, table name, and a descriptive title
+- You MUST specify the `table` parameter to indicate which table to filter
+- The query MUST return all columns from the specified table's schema (you can use `SELECT *`)
 - Use a single SQL query even if complex (subqueries and CTEs are fine)
 - Optimize for **readability over efficiency**
 - Include SQL comments to explain complex logic
 - No confirmation messages are needed: the user will see your query in the dashboard.
 
-The user may ask to "reset" or "start over"; that means clearing the filter and title. Do this by calling `querychat_reset_dashboard()`.
+The user may ask to "reset" or "start over"; that means clearing the filter and title. Do this by calling `querychat_reset_dashboard` with the relevant `table`.
 
 **Filtering Example:**
 User: "Show only rows where sales are above average"
-Tool Call: `querychat_update_dashboard({query: "SELECT * FROM table WHERE sales > (SELECT AVG(sales) FROM table)", title: "Above average sales"})`
+Tool Call: `querychat_update_dashboard({query: "SELECT * FROM sales_data WHERE sales > (SELECT AVG(sales) FROM sales_data)", table: "sales_data", title: "Above average sales"})`
 Response: ""
 
 No further response needed, the user will see the updated dashboard.
@@ -125,7 +132,7 @@ You can create visualizations using the `querychat_visualize` tool, which uses g
 
 #### Visualization best practices
 
-The database schema in this prompt includes column names, types, and summary statistics. {{#has_tool_query}}If that context isn't sufficient for a confident visualization — e.g., you're unsure about value distributions, need to check for NULLs, or want to gauge row counts before choosing a chart type — use the `querychat_query` tool to inspect the data before visualizing. Always pass `collapsed=true` for these preparatory queries so the chart remains the focal point of the response.{{/has_tool_query}}
+Use the `querychat_get_schema` tool to retrieve column names, types, and summary statistics for a table before writing visualization queries. {{#has_tool_query}}If that context isn't sufficient for a confident visualization — e.g., you're unsure about value distributions, need to check for NULLs, or want to gauge row counts before choosing a chart type — use the `querychat_query` tool to inspect the data before visualizing. Always pass `collapsed=true` for these preparatory queries so the chart remains the focal point of the response.{{/has_tool_query}}
 
 Follow the principles below to produce clear, interpretable charts.
 
diff --git a/pkg-py/src/querychat/prompts/tool-get-schema.md b/pkg-py/src/querychat/prompts/tool-get-schema.md
new file mode 100644
index 000000000..f34697223
--- /dev/null
+++ b/pkg-py/src/querychat/prompts/tool-get-schema.md
@@ -0,0 +1,18 @@
+Retrieve full column details for a table
+
+Returns column names, types, value ranges, categorical values, and descriptions for the specified table.
+
+**When to use this tool:**
+
+- Before writing any SQL query involving a table you have not yet inspected
+- When you are unsure which table is most relevant to the user's request — call this tool on candidate tables to understand their contents before deciding
+
+Parameters
+----------
+table_name
+    The name of the table to retrieve schema for. Must match one of the table names shown in the system prompt.
+
+Returns
+-------
+:
+    Full column details for the specified table, including column names, types, value ranges, categorical values, and descriptions.
diff --git a/pkg-py/src/querychat/prompts/tool-query.md b/pkg-py/src/querychat/prompts/tool-query.md
index 65bc7d899..bd8954738 100644
--- a/pkg-py/src/querychat/prompts/tool-query.md
+++ b/pkg-py/src/querychat/prompts/tool-query.md
@@ -25,6 +25,11 @@ Always use SQL for counting, averaging, summing, and other calculations—NEVER
 - When using `collapsed=false`, avoid duplicating the same rows/values in both the tool result and your response text
 - Do not reproduce large result sets in your response — summarize the key takeaways instead
 
+{{#multi_table}}
+
+**Multi-table queries:** Your schema includes multiple tables. You can reference any table in your queries and use JOINs when the data spans tables. Use the relationships described in the schema to determine join conditions.
+
+{{/multi_table}}
 Parameters
 ----------
 query :
diff --git a/pkg-py/src/querychat/prompts/tool-reset-dashboard.md b/pkg-py/src/querychat/prompts/tool-reset-dashboard.md
index 7d78b4b43..a44d0a7f1 100644
--- a/pkg-py/src/querychat/prompts/tool-reset-dashboard.md
+++ b/pkg-py/src/querychat/prompts/tool-reset-dashboard.md
@@ -2,9 +2,14 @@ Reset the dashboard to its original state
 
 Resets the dashboard to use the original unfiltered dataset and clears any custom title.
 
-If the user asks to reset the dashboard, simply call this tool with no other response. The reset action will be obvious to the user.
+If the user asks to reset the dashboard, call this tool with the relevant table name and no other response. The reset action will be obvious to the user.
 
-If the user asks to start over, call this tool and then provide a new set of suggestions for next steps. Include suggestions that encourage exploration of the data in new directions.
+If the user asks to start over, call this tool with the relevant table name and then provide a new set of suggestions for next steps. Include suggestions that encourage exploration of the data in new directions.
+
+Parameters
+----------
+table :
+    The name of the table to reset.
 
 Returns
 -------
diff --git a/pkg-py/src/querychat/prompts/tool-update-dashboard.md b/pkg-py/src/querychat/prompts/tool-update-dashboard.md
index dae9861c0..809c3b447 100644
--- a/pkg-py/src/querychat/prompts/tool-update-dashboard.md
+++ b/pkg-py/src/querychat/prompts/tool-update-dashboard.md
@@ -2,6 +2,8 @@ Filter and sort the dashboard data
 
 This tool executes a {{db_type}} SQL SELECT query to filter or sort the data used in the dashboard.
 
+The `table` parameter specifies which table to filter. Use the table name exactly as shown in the schema.
+
 **When to use:** Call this tool whenever the user requests filtering, sorting, or data manipulation on the dashboard with questions like "Show me..." or "Which records have...". This tool is appropriate for any request that involves showing a subset of the data or reordering it.
 
 **When not to use:** Do NOT use this tool for general questions about the data that can be answered with a single value or summary statistic. For those questions, use the `querychat_query` tool instead.
@@ -14,8 +16,15 @@ This tool executes a {{db_type}} SQL SELECT query to filter or sort the data use
 - Assume the user will only see the original columns in the dataset
 
 
+{{#multi_table}}
+
+**Multi-table filters:** When filtering a table, you may reference other tables in WHERE clauses, subqueries, or CTEs (e.g., filtering orders by a condition on customers). The result must still return all columns of the target table specified by the `table` parameter.
+
+{{/multi_table}}
 Parameters
 ----------
+table :
+    The name of the table to filter. Must exactly match one of the table names from the schema.
 query :
     A {{db_type}} SQL SELECT query that MUST return all existing schema columns (use SELECT * or explicitly list all columns). May include additional computed columns, subqueries, CTEs, WHERE clauses, ORDER BY, and any {{db_type}}-supported SQL functions.
 title :
diff --git a/pkg-py/src/querychat/prompts/tool-visualize.md b/pkg-py/src/querychat/prompts/tool-visualize.md
index c43f4da4d..4475cd3ef 100644
--- a/pkg-py/src/querychat/prompts/tool-visualize.md
+++ b/pkg-py/src/querychat/prompts/tool-visualize.md
@@ -10,6 +10,11 @@ Render a ggsql query (SQL with a VISUALISE clause) as an Altair chart displayed
 - Do NOT include `LABEL title => ...` in the query — use the `title` parameter instead.
 - If a visualization fails, read the error message carefully and retry with a corrected query. Common fixes: correcting column names, adding `SCALE DISCRETE` for integer categories, moving SQL expressions out of `VISUALISE` into the `SELECT` clause, and using `DRAW range` for interval-style marks instead of deprecated `errorbar`.{{#has_tool_query}} If the error persists, fall back to `querychat_query` for a tabular answer.{{/has_tool_query}}
 
+{{#multi_table}}
+
+**Multi-table queries:** The SELECT portion of your ggsql query can reference any table from the schema and use JOINs.
+
+{{/multi_table}}
 Parameters
 ----------
 ggsql :
diff --git a/pkg-py/src/querychat/static/js/querychat.js b/pkg-py/src/querychat/static/js/querychat.js
index 18d6b4f45..58f7e3ba4 100644
--- a/pkg-py/src/querychat/static/js/querychat.js
+++ b/pkg-py/src/querychat/static/js/querychat.js
@@ -9,11 +9,11 @@
     if (!chatContainer) return;
 
     const chatId = chatContainer.id;
-    const { query, title } = event.target.dataset;
+    const { query, title, table } = event.target.dataset;
 
     window.Shiny.setInputValue(
       chatId + "_update",
-      { query, title },
+      { query, title, table },
       { priority: "event" }
     );
   });
diff --git a/pkg-py/src/querychat/static/js/schema-display.js b/pkg-py/src/querychat/static/js/schema-display.js
new file mode 100644
index 000000000..b21376c6c
--- /dev/null
+++ b/pkg-py/src/querychat/static/js/schema-display.js
@@ -0,0 +1,154 @@
+/* Generated file. Source: js/src/schema-display.js. Do not edit directly. */
+
+"use strict";
+(() => {
+  // src/schema-display.js
+  var lastDisplay = null;
+  var lastDisplayTime = 0;
+  var BATCH_MS = 1e3;
+  var activePanel = null;
+  function parseColumnsJson(json) {
+    return JSON.parse(json).map((col) => ({
+      name: col.name,
+      type: col.sql_type,
+      units: col.units || null,
+      description: col.description || null,
+      constraints: col.constraints && col.constraints.length > 0 ? col.constraints.join(", ") : null,
+      range: col.min_val != null && col.max_val != null ? `${col.min_val} to ${col.max_val}` : null,
+      categories: col.categories && col.categories.length > 0 ? col.categories.map((v) => `'${v}'`).join(", ") : null
+    }));
+  }
+  function esc(s) {
+    return String(s).replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;").replace(/"/g, "&quot;");
+  }
+  var TH = "padding:0.35em 0.75em;text-align:left;white-space:nowrap;font-weight:600;border-bottom:2px solid var(--bs-border-color,#dee2e6);background:var(--bs-tertiary-bg,#f8f9fa);position:sticky;top:0;z-index:1;";
+  var TD_MONO = "padding:0.3em 0.75em;white-space:nowrap;font-family:var(--bs-font-monospace,monospace);font-size:0.875em;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));";
+  var TD_WRAP = "padding:0.3em 0.75em;max-width:22em;overflow-wrap:break-word;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));";
+  var TD_NOWRAP = "padding:0.3em 0.75em;white-space:nowrap;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));";
+  function renderTable(columns) {
+    const rows = columns.map((col) => {
+      let typeCell = esc(col.type);
+      if (col.units) {
+        typeCell += ` <span style="color:var(--bs-secondary-color,#6c757d)">[${esc(col.units)}]</span>`;
+      }
+      const details = col.range ? esc(col.range) : col.categories ? esc(col.categories) : "";
+      return `<tr><td style="${TD_MONO}">${esc(col.name)}</td><td style="${TD_MONO}">${typeCell}</td><td style="${TD_WRAP}">${col.description ? esc(col.description) : ""}</td><td style="${TD_NOWRAP}">${col.constraints ? esc(col.constraints) : ""}</td><td style="${TD_WRAP}">${details}</td></tr>`;
+    }).join("");
+    return `<table style="border-collapse:collapse;min-width:100%;width:max-content;font-size:0.875em;"><thead><tr><th style="${TH}">Column</th><th style="${TH}">Type</th><th style="${TH}">Description</th><th style="${TH}">Constraints</th><th style="${TH}">Range / Values</th></tr></thead><tbody>${rows}</tbody></table>`;
+  }
+  var PANEL_STYLE = "position:fixed;z-index:9999;background:var(--bs-body-bg,#fff);color:var(--bs-body-color,#212529);border:1px solid var(--bs-border-color,#dee2e6);border-radius:var(--bs-border-radius,0.375rem);box-shadow:0 4px 16px rgba(0,0,0,.15);overflow:auto;max-height:min(420px,60vh);";
+  function positionPanel(btn, panel) {
+    const rect = btn.getBoundingClientRect();
+    const vw = window.innerWidth;
+    const vh = window.innerHeight;
+    const pw = Math.min(Math.max(360, vw * 0.55), vw - 16);
+    panel.style.width = `${pw}px`;
+    panel.style.left = `${Math.max(8, Math.min(rect.left, vw - pw - 8))}px`;
+    const spaceBelow = vh - rect.bottom - 8;
+    const spaceAbove = rect.top - 8;
+    if (spaceBelow >= 120 || spaceBelow >= spaceAbove) {
+      panel.style.top = `${rect.bottom + 4}px`;
+    } else {
+      const panelH = Math.min(420, spaceAbove);
+      panel.style.top = `${Math.max(8, rect.top - panelH - 4)}px`;
+    }
+  }
+  function closePanel() {
+    if (activePanel) {
+      activePanel.panel.hidden = true;
+      activePanel.btn.setAttribute("aria-expanded", "false");
+      activePanel = null;
+    }
+  }
+  document.addEventListener("click", closePanel);
+  document.addEventListener("keydown", (e) => {
+    if (e.key === "Escape") closePanel();
+  });
+  window.addEventListener(
+    "scroll",
+    (e) => {
+      if (activePanel && !activePanel.panel.contains(
+        /** @type {Node} */
+        e.target
+      )) {
+        closePanel();
+      }
+    },
+    true
+  );
+  window.addEventListener("resize", closePanel);
+  function createBtn(tableName, columnsJson) {
+    const columns = parseColumnsJson(columnsJson);
+    const btn = document.createElement("button");
+    btn.type = "button";
+    btn.style.cssText = "background:none;border:none;padding:0;color:inherit;text-decoration:underline dotted;cursor:pointer;font-size:inherit;border-radius:2px;";
+    btn.textContent = tableName;
+    btn.setAttribute("aria-label", `Show schema for ${tableName}`);
+    btn.setAttribute("aria-expanded", "false");
+    btn.setAttribute("aria-haspopup", "dialog");
+    const panel = document.createElement("div");
+    panel.setAttribute("role", "dialog");
+    panel.setAttribute("aria-label", `${tableName} schema`);
+    panel.style.cssText = PANEL_STYLE;
+    panel.hidden = true;
+    panel.innerHTML = renderTable(columns);
+    document.body.appendChild(panel);
+    btn.addEventListener("click", (e) => {
+      e.stopPropagation();
+      if (activePanel && activePanel.panel === panel) {
+        closePanel();
+        return;
+      }
+      closePanel();
+      positionPanel(btn, panel);
+      panel.hidden = false;
+      btn.setAttribute("aria-expanded", "true");
+      activePanel = { btn, panel };
+    });
+    panel.addEventListener("click", (e) => e.stopPropagation());
+    return btn;
+  }
+  var style = document.createElement("style");
+  style.textContent = ".qc-schema-display button:focus-visible{outline:2px solid currentColor;outline-offset:2px;border-radius:2px}";
+  document.head.appendChild(style);
+  function processCollector(sentinel) {
+    const now = Date.now();
+    const tableName = sentinel.dataset.table;
+    const btn = createBtn(tableName, sentinel.dataset.schemaJson);
+    if (lastDisplay && document.contains(lastDisplay) && now - lastDisplayTime < BATCH_MS) {
+      lastDisplay.appendChild(document.createTextNode(", "));
+      lastDisplay.appendChild(btn);
+      sentinel.remove();
+    } else {
+      const p = document.createElement("p");
+      p.className = "qc-schema-display";
+      p.style.cssText = "color:var(--bs-secondary-color,#6c757d);font-size:0.875em;margin:0.1rem 0;";
+      p.appendChild(document.createTextNode("\u{1F50D} Fetched schemas: "));
+      p.appendChild(btn);
+      sentinel.replaceWith(p);
+      lastDisplay = p;
+    }
+    lastDisplayTime = now;
+  }
+  new MutationObserver((mutations) => {
+    for (const { addedNodes } of mutations) {
+      for (const node of addedNodes) {
+        if (node.nodeType !== 1) continue;
+        if (
+          /** @type {Element} */
+          node.classList.contains("qc-schema-collector")
+        ) {
+          processCollector(
+            /** @type {HTMLElement} */
+            node
+          );
+        } else {
+          node.querySelectorAll(".qc-schema-collector").forEach((el) => processCollector(
+            /** @type {HTMLElement} */
+            el
+          ));
+        }
+      }
+    }
+  }).observe(document.body, { subtree: true, childList: true });
+})();
diff --git a/pkg-py/src/querychat/streamlit.py b/pkg-py/src/querychat/streamlit.py
index ddd895bfb..5b82bc3fc 100644
--- a/pkg-py/src/querychat/streamlit.py
+++ b/pkg-py/src/querychat/streamlit.py
@@ -1,5 +1,5 @@
 """Streamlit integration for querychat."""
 
-from ._streamlit import QueryChat
+from ._streamlit import QueryChat, StreamlitTableAccessor
 
-__all__ = ["QueryChat"]
+__all__ = ["QueryChat", "StreamlitTableAccessor"]
diff --git a/pkg-py/src/querychat/tools.py b/pkg-py/src/querychat/tools.py
index 48a17b5cc..b446b1819 100644
--- a/pkg-py/src/querychat/tools.py
+++ b/pkg-py/src/querychat/tools.py
@@ -1,10 +1,18 @@
 from __future__ import annotations
 
+import html
+import json
+from collections.abc import Callable
 from typing import TYPE_CHECKING, Any, Protocol, TypedDict, runtime_checkable
 
-from chatlas import ContentToolResult, Tool
-from shinychat.types import ToolResultDisplay
+from chatlas import ContentToolRequest, ContentToolResult, Tool
+from htmltools import HTMLDependency, TagList, tags
+from pydantic import Field
+from shinychat import message_content_chunk
+from shinychat.types import ChatMessage, ToolResultDisplay
 
+from .__version import __version__
+from ._datasource import ColumnMeta, format_schema
 from ._icons import bs_icon
 from ._utils import (
     as_narwhals,
@@ -16,6 +24,8 @@
 from ._viz_tools import tool_visualize
 
 __all__ = [
+    "GetSchemaResult",
+    "tool_get_schema",
     "tool_query",
     "tool_reset_dashboard",
     "tool_update_dashboard",
@@ -23,9 +33,129 @@
 ]
 
 if TYPE_CHECKING:
-    from collections.abc import Callable
+    from ._data_dict import DataDict
+    from ._query_executor import QueryExecutor
 
-    from ._datasource import DataSource
+
+ResetDashboardCallback = Callable[[str], None]
+
+
+class GetSchemaResult(ContentToolResult):
+    """Tool result that carries schema text and structured column metadata for a single table."""
+
+    table_name: str
+    columns: list[ColumnMeta] = Field(default_factory=list)
+
+
+def _col_to_dict(col: ColumnMeta) -> dict[str, Any]:
+    return {
+        "name": col.name,
+        "sql_type": col.sql_type,
+        "units": col.units,
+        "description": col.description,
+        "min_val": str(col.min_val) if col.min_val is not None else None,
+        "max_val": str(col.max_val) if col.max_val is not None else None,
+        "categories": col.categories,
+        "constraints": col.constraints,
+    }
+
+
+_orig_request_handler = message_content_chunk.dispatch(ContentToolRequest)
+
+
+@message_content_chunk.register
+def _(request: ContentToolRequest) -> ChatMessage:
+    if request.name == "querychat_get_schema":
+        return ChatMessage(content="")
+    return _orig_request_handler(request)
+
+
+@message_content_chunk.register
+def _(message: GetSchemaResult) -> ChatMessage:
+    columns_json = json.dumps([_col_to_dict(c) for c in message.columns])
+    content = TagList(
+        tags.span(
+            class_="qc-schema-collector",
+            data_table=message.table_name,
+            data_schema=str(message.value),
+            data_schema_json=columns_json,
+            style="display:none",
+        ),
+        _schema_dep(),
+    )
+    return ChatMessage(content=content)
+
+
+def _schema_dep() -> HTMLDependency:
+    return HTMLDependency(
+        "querychat-schema-display",
+        __version__,
+        source={"package": "querychat", "subdir": "static"},
+        script=[{"src": "js/schema-display.js"}],
+    )
+
+
+def _get_schema_impl(
+    data_dicts: list[DataDict],
+    executor: QueryExecutor,
+    table_names: list[str],
+    categorical_threshold: int,
+) -> Callable[[str], ContentToolResult]:
+    def get_schema(table_name: str) -> ContentToolResult:
+        if table_name not in table_names:
+            available = ", ".join(table_names)
+            error = f"Table '{table_name}' not found. Available: {available}"
+            return ContentToolResult(value=error, error=Exception(error))
+
+        dd = next((d for d in data_dicts if table_name in d.tables), None)
+        if dd is not None:
+            columns = dd.get_table_schema(table_name, executor, categorical_threshold)
+        else:
+            columns = executor.get_column_details(table_name, categorical_threshold)
+
+        schema_text = format_schema(table_name, columns)
+        return GetSchemaResult(value=schema_text, table_name=table_name, columns=columns)
+
+    return get_schema
+
+
+def tool_get_schema(
+    data_dicts: list[DataDict],
+    executor: QueryExecutor,
+    table_names: list[str],
+    categorical_threshold: int,
+) -> Tool:
+    """
+    Create a tool that retrieves full column details for a table.
+
+    Parameters
+    ----------
+    data_dicts
+        Data dictionaries with enriched column metadata. The first dict that
+        covers a requested table is used; tables not covered by any dict fall
+        back to live statistics from the executor.
+    executor
+        The query executor to use for schema introspection.
+    table_names
+        List of valid table names.
+    categorical_threshold
+        Maximum number of unique values before a text column is treated as
+        free-form rather than categorical.
+
+    Returns
+    -------
+    Tool
+        A tool that can be registered with chatlas.
+
+    """
+    impl = _get_schema_impl(data_dicts, executor, table_names, categorical_threshold)
+    description = read_prompt_template("tool-get-schema.md")
+    impl.__doc__ = description
+    return Tool.from_func(
+        impl,
+        name="querychat_get_schema",
+        annotations={"title": "Get Schema"},
+    )
 
 
 @runtime_checkable
@@ -52,6 +182,8 @@ class UpdateDashboardData(TypedDict):
 
     Attributes
     ----------
+    table
+        The name of the table being filtered.
     query
         The SQL query string to execute for filtering/sorting the dashboard.
     title
@@ -66,6 +198,7 @@ class UpdateDashboardData(TypedDict):
 
 
     def log_update(data: UpdateDashboardData):
+        print(f"Table: {data['table']}")
         print(f"Executing: {data['query']}")
         print(f"Title: {data['title']}")
 
@@ -77,35 +210,45 @@ def log_update(data: UpdateDashboardData):
 
     """
 
+    table: str
     query: str
     title: str
 
 
 def _update_dashboard_impl(
-    data_source: DataSource,
+    executor: QueryExecutor,
+    table_names: list[str],
     update_fn: Callable[[UpdateDashboardData], None],
-) -> Callable[[str, str], ContentToolResult]:
+) -> Callable[[str, str, str], ContentToolResult]:
     """Create the implementation function for updating the dashboard."""
 
-    def update_dashboard(query: str, title: str) -> ContentToolResult:
+    def update_dashboard(table: str, query: str, title: str) -> ContentToolResult:
         error = None
         markdown = f"```sql\n{query}\n```"
         value = "Dashboard updated. Use `query` tool to review results, if needed."
 
+        # Validate table exists
+        if table not in table_names:
+            available = ", ".join(table_names)
+            error = f"Table '{table}' not found. Available: {available}"
+            markdown += f"\n\n> Error: {error}"
+            return ContentToolResult(value=markdown, error=Exception(error))
+
         try:
             # Test the query but don't execute it yet
-            data_source.test_query(query, require_all_columns=True)
+            executor.test_query(query, table_name=table, require_all_columns=True)
 
             # Add Apply Filter button
             button_html = f"""<button
                 class="btn btn-outline-primary btn-sm float-end mt-3 querychat-update-dashboard-btn"
-                data-query="{query}"
-                data-title="{title}">
+                data-table="{html.escape(table, quote=True)}"
+                data-query="{html.escape(query, quote=True)}"
+                data-title="{html.escape(title, quote=True)}">
                 Apply Filter
             </button>"""
 
             # Call the callback with TypedDict data on success
-            update_fn({"query": query, "title": title})
+            update_fn({"table": table, "query": query, "title": title})
 
         except Exception as e:
             error = truncate_error(str(e))
@@ -130,30 +273,38 @@ def update_dashboard(query: str, title: str) -> ContentToolResult:
 
 
 def tool_update_dashboard(
-    data_source: DataSource,
+    executor: QueryExecutor,
+    table_names: list[str],
     update_fn: Callable[[UpdateDashboardData], None],
+    *,
+    multi_table: bool = False,
 ) -> Tool:
     """
-    Create a tool that modifies the data presented in the dashboard based on the SQL query.
+    Create a tool that modifies the data presented in the dashboard.
 
     Parameters
     ----------
-    data_source
-        The data source to query against
+    executor
+        The query executor to validate queries against.
+    table_names
+        List of valid table names for validation.
     update_fn
-        Callback function to call with UpdateDashboardData when update succeeds
+        Callback function to call with UpdateDashboardData when update succeeds.
+    multi_table
+        Whether multiple tables are registered.
 
     Returns
     -------
     Tool
-        A tool that can be registered with chatlas
+        A tool that can be registered with chatlas.
 
     """
-    impl = _update_dashboard_impl(data_source, update_fn)
+    impl = _update_dashboard_impl(executor, table_names, update_fn)
 
     description = read_prompt_template(
         "tool-update-dashboard.md",
-        db_type=data_source.get_db_type(),
+        db_type=executor.get_db_type(),
+        multi_table=multi_table,
     )
     impl.__doc__ = description
 
@@ -165,17 +316,27 @@ def tool_update_dashboard(
 
 
 def _reset_dashboard_impl(
-    reset_fn: Callable[[], None],
-) -> Callable[[], ContentToolResult]:
+    reset_fn: ResetDashboardCallback,
+    table_names: list[str] | None,
+) -> Callable[[str], ContentToolResult]:
     """Create the implementation function for resetting the dashboard."""
 
-    def reset_dashboard() -> ContentToolResult:
+    def reset_dashboard(table: str) -> ContentToolResult:
+        if table_names is not None and table not in table_names:
+            available = ", ".join(table_names)
+            error = f"Table '{table}' not found. Available: {available}"
+            return ContentToolResult(
+                value=error,
+                error=Exception(error),
+            )
+
         # Call the callback to reset
-        reset_fn()
+        reset_fn(table)
 
         # Add Reset Filter button
-        button_html = """<button
+        button_html = f"""<button
             class="btn btn-outline-primary btn-sm float-end mt-3 querychat-update-dashboard-btn"
+            data-table="{html.escape(table, quote=True)}"
             data-query=""
             data-title="">
             Reset Filter
@@ -199,7 +360,8 @@ def reset_dashboard() -> ContentToolResult:
 
 
 def tool_reset_dashboard(
-    reset_fn: Callable[[], None],
+    reset_fn: ResetDashboardCallback,
+    table_names: list[str] | None = None,
 ) -> Tool:
     """
     Create a tool that resets the dashboard to show all data.
@@ -207,15 +369,17 @@ def tool_reset_dashboard(
     Parameters
     ----------
     reset_fn
-        Callback function to call when reset is invoked
+        Callback function to call with the table name when a reset is requested.
+    table_names
+        Optional list of valid table names for validation.
 
     Returns
     -------
     Tool
-        A tool that can be registered with chatlas
+        A tool that can be registered with chatlas.
 
     """
-    impl = _reset_dashboard_impl(reset_fn)
+    impl = _reset_dashboard_impl(reset_fn, table_names)
 
     description = read_prompt_template("tool-reset-dashboard.md")
     impl.__doc__ = description
@@ -227,7 +391,7 @@ def tool_reset_dashboard(
     )
 
 
-def _query_impl(data_source: DataSource) -> Callable[..., ContentToolResult]:
+def _query_impl(executor: QueryExecutor) -> Callable[..., ContentToolResult]:
     """Create the implementation function for querying data."""
 
     def query(
@@ -240,7 +404,7 @@ def query(
         value = None
 
         try:
-            result_df = data_source.execute_query(query)
+            result_df = executor.execute_query(query)
             nw_df = as_narwhals(result_df)
             value = nw_df.rows(named=True)
 
@@ -270,25 +434,30 @@ def query(
     return query
 
 
-def tool_query(data_source: DataSource) -> Tool:
+def tool_query(executor: QueryExecutor, *, multi_table: bool = False) -> Tool:
     """
     Create a tool that performs a SQL query on the data.
 
     Parameters
     ----------
-    data_source
-        The data source to query against
+    executor
+        The query executor to use for running queries.
+    multi_table
+        Whether multiple tables are registered. When True, multi-table
+        query guidance is included in the tool description.
 
     Returns
     -------
     Tool
-        A tool that can be registered with chatlas
+        A tool that can be registered with chatlas.
 
     """
-    impl = _query_impl(data_source)
+    impl = _query_impl(executor)
 
     description = read_prompt_template(
-        "tool-query.md", db_type=data_source.get_db_type()
+        "tool-query.md",
+        db_type=executor.get_db_type(),
+        multi_table=multi_table,
     )
     impl.__doc__ = description
 
diff --git a/pkg-py/src/querychat/types/__init__.py b/pkg-py/src/querychat/types/__init__.py
index 1bf6f04f7..5f2a76453 100644
--- a/pkg-py/src/querychat/types/__init__.py
+++ b/pkg-py/src/querychat/types/__init__.py
@@ -8,7 +8,8 @@
 )
 from .._pin_source import PinSource
 from .._querychat_core import AppStateDict
-from .._shiny_module import ServerValues
+from .._shiny_module import ServerValues, TableState
+from .._table_accessor import TableAccessor
 from .._utils import UnsafeQueryError
 from .._viz_tools import VisualizeData, VisualizeResult
 from ..tools import UpdateDashboardData
@@ -23,6 +24,8 @@
     "PolarsLazySource",
     "SQLAlchemySource",
     "ServerValues",
+    "TableAccessor",
+    "TableState",
     "UnsafeQueryError",
     "UpdateDashboardData",
     "VisualizeData",
diff --git a/pkg-py/tests/playwright/test_01_hello_app.py b/pkg-py/tests/playwright/test_01_hello_app.py
index 8ca0b8e5c..ec9ff9909 100644
--- a/pkg-py/tests/playwright/test_01_hello_app.py
+++ b/pkg-py/tests/playwright/test_01_hello_app.py
@@ -200,6 +200,40 @@ def test_sql_updates_on_query(self) -> None:
             re.compile(r"WHERE.*sex.*=.*['\"]?male['\"]?", re.IGNORECASE), timeout=60000
         )
 
+    # ==================== Filter Button Tests ====================
+
+    def test_apply_filter_button_re_applies_filter(self) -> None:
+        """FILTER-01: Apply Filter button re-applies the filter after a reset."""
+        self.chat.set_user_input("Show only first class passengers")
+        self.chat.send_user_input(method="click")
+
+        sql_code = self.page.locator("pre code").first
+        expect(sql_code).to_contain_text(
+            re.compile(r"WHERE.*(p?class).*=.*(1|['\"]First['\"])", re.IGNORECASE),
+            timeout=60000,
+        )
+
+        apply_btn = self.page.locator(".querychat-update-dashboard-btn").first
+        expect(apply_btn).to_be_visible(timeout=10000)
+        assert apply_btn.get_attribute("data-table") == "titanic"
+        assert apply_btn.get_attribute("data-query") not in (None, "")
+
+        # Reset the filter directly via Shiny JS (no second LLM call)
+        self.page.evaluate(
+            """
+            window.Shiny.setInputValue(
+                'querychat_titanic-chat_update',
+                {table: 'titanic', query: '', title: ''},
+                {priority: 'event'}
+            );
+            """
+        )
+        expect(self.page.locator("text=891")).to_be_visible(timeout=10000)
+
+        apply_btn.click()
+
+        expect(self.page.locator("text=891")).not_to_be_visible(timeout=5000)
+
     # ==================== Stream Cancellation Tests ====================
 
     def test_stop_button_appears_during_streaming(self) -> None:
diff --git a/pkg-py/tests/playwright/test_03_sidebar_apps.py b/pkg-py/tests/playwright/test_03_sidebar_apps.py
index 64ee7fea0..680e94015 100644
--- a/pkg-py/tests/playwright/test_03_sidebar_apps.py
+++ b/pkg-py/tests/playwright/test_03_sidebar_apps.py
@@ -53,9 +53,9 @@ def test_card_header_initial(self) -> None:
 
     def test_data_table_visible(self) -> None:
         """Data table is visible with rows."""
-        table = self.page.locator("table")
+        table = self.page.locator("table[aria-rowcount]")
         expect(table).to_be_visible()
-        rows = self.page.locator("table tbody tr")
+        rows = self.page.locator("table[aria-rowcount] tbody tr")
         expect(rows.first).to_be_visible()
 
     def test_chat_input_visible(self) -> None:
@@ -96,7 +96,7 @@ def test_filter_query_updates_table(self) -> None:
         )
 
         # Table should still be visible (with filtered data)
-        table = self.page.locator("table")
+        table = self.page.locator("table[aria-rowcount]")
         expect(table).to_be_visible()
 
     def test_analytical_query_in_chat(self) -> None:
@@ -137,9 +137,9 @@ def test_card_header_initial(self) -> None:
 
     def test_data_table_visible(self) -> None:
         """Data table is visible with rows."""
-        table = self.page.locator("table")
+        table = self.page.locator("table[aria-rowcount]")
         expect(table).to_be_visible()
-        rows = self.page.locator("table tbody tr")
+        rows = self.page.locator("table[aria-rowcount] tbody tr")
         expect(rows.first).to_be_visible()
 
     def test_chat_input_visible(self) -> None:
@@ -180,7 +180,7 @@ def test_filter_query_updates_table(self) -> None:
         )
 
         # Table should still be visible (with filtered data)
-        table = self.page.locator("table")
+        table = self.page.locator("table[aria-rowcount]")
         expect(table).to_be_visible()
 
     def test_analytical_query_in_chat(self) -> None:
diff --git a/pkg-py/tests/test_base.py b/pkg-py/tests/test_base.py
index cffb932fa..9680e188c 100644
--- a/pkg-py/tests/test_base.py
+++ b/pkg-py/tests/test_base.py
@@ -1,12 +1,16 @@
 """Tests for QueryChatBase and normalization functions."""
 
 import os
+import warnings
+from pathlib import Path
 from typing import Any
 
 import chatlas
 import narwhals.stable.v1 as nw
 import pandas as pd
+import polars as pl
 import pytest
+from querychat._data_dict import DataDict, TableSpec
 from querychat._datasource import DataFrameSource, SQLAlchemySource
 from querychat._querychat_base import (
     QueryChatBase,
@@ -14,6 +18,7 @@
     normalize_data_source,
     normalize_tools,
 )
+from querychat._shiny import QueryChat
 from querychat._utils import MISSING
 from sqlalchemy import create_engine, text
 
@@ -170,9 +175,18 @@ def test_filter_and_update_deduplicated(self):
 
 
 class TestQueryChatBase:
+    def test_init_no_args(self):
+        qc = QueryChatBase()
+        assert qc.table_names() == []
+
+    def test_init_no_args_then_add_table(self, sample_df):
+        qc = QueryChatBase()
+        qc.add_table(sample_df, "test_table")
+        assert qc.table_names() == ["test_table"]
+
     def test_init_with_dataframe(self, sample_df):
         qc = QueryChatBase(sample_df, "test_table")
-        assert isinstance(qc.data_source, DataFrameSource)
+        assert isinstance(qc._data_sources["test_table"], DataFrameSource)
         assert qc.tools == {"update", "query"}
 
     def test_init_with_custom_greeting(self, sample_df):
@@ -194,10 +208,6 @@ def test_invalid_table_name_raises(self, sample_df):
         with pytest.raises(ValueError, match="Table name must begin with a letter"):
             QueryChatBase(sample_df, "table-with-dash")
 
-    def test_data_source_property(self, sample_df):
-        qc = QueryChatBase(sample_df, "test_table")
-        assert qc.data_source is qc._data_source
-
     def test_system_prompt_property(self, sample_df):
         qc = QueryChatBase(sample_df, "test_table")
         prompt = qc.system_prompt
@@ -213,6 +223,7 @@ def test_client_with_tools_none(self, sample_df):
         qc = QueryChatBase(sample_df, "test_table")
         client = qc.client(tools=None)
         assert isinstance(client, chatlas.Chat)
+        assert client.get_tools() == []
 
     def test_client_with_callbacks(self, sample_df):
         qc = QueryChatBase(sample_df, "test_table")
@@ -234,3 +245,121 @@ def reset_dashboard():
     def test_cleanup(self, sample_df):
         qc = QueryChatBase(sample_df, "test_table")
         qc.cleanup()
+
+
+class TestDataDict:
+    def test_data_dict_path_accepted(self, tmp_path: Path) -> None:
+        f = tmp_path / "spec.yaml"
+        f.write_text('version: "0.1.0"\ntables:\n  t:\n    columns: []\n')
+        df = pl.DataFrame({"x": [1]})
+        qc = QueryChat(df, table_name="t", data_dict=str(f))
+        assert len(qc._data_dicts) == 1
+        assert "t" in qc._data_dicts[0].tables
+
+    def test_data_dict_instance_accepted(self) -> None:
+        dd = DataDict(tables={"t": TableSpec(columns=[])})
+        df = pl.DataFrame({"x": [1]})
+        qc = QueryChat(df, table_name="t", data_dict=dd)
+        assert qc._data_dicts[0] is dd
+
+    def test_data_dict_table_not_in_dict_is_allowed(self) -> None:
+        dd = DataDict(tables={"other": TableSpec(columns=[])})
+        df = pl.DataFrame({"x": [1]})
+        qc = QueryChat(df, table_name="t", data_dict=dd)
+        assert "t" in qc._data_sources
+
+    def test_add_table_not_in_data_dict_is_allowed(self) -> None:
+        dd = DataDict(
+            tables={"t1": TableSpec(columns=[])},
+        )
+        df = pl.DataFrame({"x": [1]})
+        qc = QueryChat(df, table_name="t1", data_dict=dd)
+        df2 = pl.DataFrame({"y": [2]})
+        qc.add_table(df2, "t2")
+        assert "t2" in qc._data_sources
+
+    def test_data_description_accepted(self) -> None:
+        df = pl.DataFrame({"x": [1]})
+        with warnings.catch_warnings(record=True) as w:
+            warnings.simplefilter("always")
+            QueryChat(df, table_name="t", data_description="some desc")
+        assert not any(issubclass(warning.category, DeprecationWarning) for warning in w)
+
+
+@pytest.fixture
+def multi_table_engine():
+    engine = create_engine("sqlite:///:memory:")
+    with engine.connect() as conn:
+        conn.execute(
+            text(
+                "CREATE TABLE orders (id INTEGER PRIMARY KEY, amount REAL)"
+            )
+        )
+        conn.execute(
+            text(
+                "CREATE TABLE customers (id INTEGER PRIMARY KEY, name TEXT)"
+            )
+        )
+        conn.execute(text("INSERT INTO orders VALUES (1, 99.99), (2, 49.50)"))
+        conn.execute(text("INSERT INTO customers VALUES (1, 'Alice'), (2, 'Bob')"))
+        conn.commit()
+    return engine
+
+
+class TestAddTables:
+    def test_auto_discovery_registers_all_tables(self, multi_table_engine):
+        qc = QueryChatBase()
+        with warnings.catch_warnings(record=True):
+            warnings.simplefilter("always")
+            qc.add_tables(multi_table_engine)
+        assert set(qc.table_names()) == {"orders", "customers"}
+
+    def test_explicit_tables_registers_only_those(self, multi_table_engine):
+        qc = QueryChatBase()
+        qc.add_tables(multi_table_engine, ["orders"])
+        assert qc.table_names() == ["orders"]
+
+    def test_nonexistent_table_raises(self, multi_table_engine):
+        qc = QueryChatBase()
+        with pytest.raises(ValueError, match="'nonexistent' not found"):
+            qc.add_tables(multi_table_engine, ["nonexistent"])
+
+    def test_duplicate_without_replace_raises(self, multi_table_engine):
+        qc = QueryChatBase()
+        qc.add_tables(multi_table_engine, ["orders"])
+        with pytest.raises(ValueError, match="Table 'orders' already exists"):
+            qc.add_tables(multi_table_engine, ["orders"])
+
+    def test_replace_true_succeeds(self, multi_table_engine):
+        qc = QueryChatBase()
+        qc.add_tables(multi_table_engine, ["orders"])
+        qc.add_tables(multi_table_engine, ["orders"], replace=True)
+        assert "orders" in qc.table_names()
+
+    def test_non_engine_raises_type_error(self, sample_df):
+        qc = QueryChatBase()
+        with pytest.raises(TypeError, match=r"sqlalchemy\.Engine"):
+            qc.add_tables(sample_df)  # type: ignore[arg-type]
+
+    def test_empty_list_raises(self, multi_table_engine):
+        qc = QueryChatBase()
+        with pytest.raises(ValueError, match="No tables found"):
+            qc.add_tables(multi_table_engine, [])
+
+    def test_after_server_raises(self, multi_table_engine):
+        qc = QueryChatBase()
+        qc._server_initialized = True
+        with pytest.raises(RuntimeError, match="Cannot add tables after server"):
+            qc.add_tables(multi_table_engine)
+
+    def test_system_prompt_built_exactly_once(self, multi_table_engine):
+        qc = QueryChatBase()
+        with warnings.catch_warnings(record=True) as w:
+            warnings.simplefilter("always")
+            qc.add_tables(multi_table_engine)
+        multi_table_warns = [
+            x for x in w
+            if issubclass(x.category, UserWarning)
+            and "Multiple tables" in str(x.message)
+        ]
+        assert len(multi_table_warns) == 1
diff --git a/pkg-py/tests/test_client_console.py b/pkg-py/tests/test_client_console.py
index f9d32e5b2..b147c329c 100644
--- a/pkg-py/tests/test_client_console.py
+++ b/pkg-py/tests/test_client_console.py
@@ -132,6 +132,16 @@ def my_reset():
         # Callback should be registered
         assert client is not None
 
+    def test_client_prompt_requires_table_for_reset_dashboard(self, sample_df):
+        """Reset guidance in the prompt should match the tool contract."""
+        qc = QueryChat(sample_df, "test_table", greeting="Hello!")
+
+        prompt = qc.client().system_prompt
+
+        assert "querychat_reset_dashboard()" not in prompt
+        assert "querychat_reset_dashboard" in prompt
+        assert "relevant `table`" in prompt
+
     def test_client_respects_initialization_tools(self, sample_df):
         """Test that client() respects tools set at initialization."""
         qc = QueryChat(sample_df, "test_table", greeting="Hello!", tools="query")
diff --git a/pkg-py/tests/test_data_dict.py b/pkg-py/tests/test_data_dict.py
new file mode 100644
index 000000000..891d39bcb
--- /dev/null
+++ b/pkg-py/tests/test_data_dict.py
@@ -0,0 +1,233 @@
+from pathlib import Path
+
+import narwhals.stable.v1 as nw
+import polars as pl
+from querychat._data_dict import ColumnRange, ColumnSpec, DataDict, TableSpec
+from querychat._datasource import DataFrameSource
+from querychat._query_executor import DataSourceExecutor
+
+
+def test_from_yaml_full_spec(tmp_path: Path) -> None:
+    yaml_content = """\
+version: "0.1.0"
+tables:
+  orders:
+    description: One row per order.
+    columns:
+      - name: order_id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique order identifier.
+        examples: [1, 2, 3]
+      - name: amount
+        type: number(quantity)
+        range:
+          min: 0
+          max: 10000
+      - name: status
+        type: enum
+        values: [pending, shipped, delivered]
+relationships:
+  - description: Order placed by customer.
+    cardinality: many-to-one
+    join: orders.customer_id = customers.id
+glossary:
+  churn: Customer with no orders in 90+ days.
+"""
+    f = tmp_path / "spec.yaml"
+    f.write_text(yaml_content)
+    dd = DataDict.from_yaml(f)
+
+    assert "orders" in dd.tables
+    t = dd.tables["orders"]
+    assert t.description == "One row per order."
+    assert len(t.columns) == 3
+
+    col = t.columns[0]
+    assert col.name == "order_id"
+    assert col.description == "Unique order identifier."
+    assert col.constraints == ["primary_key"]
+
+    col = t.columns[1]
+    assert col.range is not None
+    assert col.range.min == 0
+    assert col.range.max == 10000
+
+    col = t.columns[2]
+    assert col.values == ["pending", "shipped", "delivered"]
+
+    assert len(dd.relationships) == 1
+    assert dd.relationships[0].join == "orders.customer_id = customers.id"
+    assert dd.relationships[0].cardinality == "many-to-one"
+    assert dd.glossary["churn"] == "Customer with no orders in 90+ days."
+
+
+def test_from_yaml_partial_spec(tmp_path: Path) -> None:
+    f = tmp_path / "spec.yaml"
+    f.write_text('version: "0.1.0"\ntables:\n  orders:\n    columns: []\n')
+    dd = DataDict.from_yaml(f)
+    assert dd.tables["orders"].description is None
+    assert dd.relationships == []
+    assert dd.glossary == {}
+
+
+def test_from_yaml_str_path(tmp_path: Path) -> None:
+    f = tmp_path / "spec.yaml"
+    f.write_text('version: "0.1.0"\n')
+    dd = DataDict.from_yaml(str(f))
+    assert dd.tables == {}
+
+
+def test_name_and_description_are_optional() -> None:
+    dd = DataDict()
+    assert dd.name is None
+    assert dd.description is None
+
+
+def test_from_yaml_derives_name_from_file_stem(tmp_path: Path) -> None:
+    f = tmp_path / "my_schema.yaml"
+    f.write_text('version: "0.1.0"\n')
+    dd = DataDict.from_yaml(f)
+    assert dd.name == "my_schema"
+
+
+def test_from_yaml_explicit_name_overrides_stem(tmp_path: Path) -> None:
+    f = tmp_path / "file_name.yaml"
+    f.write_text("name: custom_name\n")
+    dd = DataDict.from_yaml(f)
+    assert dd.name == "custom_name"
+
+
+def test_from_yaml_loads_description(tmp_path: Path) -> None:
+    f = tmp_path / "spec.yaml"
+    f.write_text('description: "Sales data"\n')
+    dd = DataDict.from_yaml(f)
+    assert dd.description == "Sales data"
+
+
+def test_from_yaml_description_defaults_to_none(tmp_path: Path) -> None:
+    f = tmp_path / "spec.yaml"
+    f.write_text('version: "0.1.0"\n')
+    dd = DataDict.from_yaml(f)
+    assert dd.description is None
+
+
+def _make_executor(df: pl.DataFrame, table_name: str) -> DataSourceExecutor:
+    source = DataFrameSource(nw.from_native(df), table_name)
+    return DataSourceExecutor({table_name: source})
+
+
+def test_get_table_schema_all_documented() -> None:
+    dd = DataDict(
+        tables={
+            "orders": TableSpec(
+                description="Order records.",
+                columns=[
+                    ColumnSpec(
+                        name="amount",
+                        description="Order total in USD.",
+                        range=ColumnRange(min=0, max=500),
+                    ),
+                    ColumnSpec(
+                        name="status",
+                        values=["pending", "shipped"],
+                    ),
+                ],
+            )
+        },
+    )
+    df = pl.DataFrame({"amount": [10, 20], "status": ["pending", "shipped"]})
+    executor = _make_executor(df, "orders")
+    cols = dd.get_table_schema("orders", executor, categorical_threshold=10)
+    col_map = {c.name: c for c in cols}
+    assert "amount" in col_map
+    assert col_map["amount"].min_val == 0
+    assert col_map["amount"].max_val == 500
+    assert col_map["amount"].description == "Order total in USD."
+    assert "status" in col_map
+    assert "pending" in col_map["status"].categories
+
+
+def test_get_table_schema_no_documentation() -> None:
+    dd = DataDict(tables={"orders": TableSpec(columns=[])})
+    df = pl.DataFrame({"amount": [10, 20, 30], "status": ["a", "b", "a"]})
+    executor = _make_executor(df, "orders")
+    cols = dd.get_table_schema("orders", executor, categorical_threshold=10)
+    col_names = [c.name for c in cols]
+    # SQL fallback should populate stats
+    assert "amount" in col_names
+    assert "status" in col_names
+
+
+def test_get_table_schema_mixed_coverage() -> None:
+    dd = DataDict(
+        tables={
+            "orders": TableSpec(
+                columns=[
+                    ColumnSpec(name="amount", range=ColumnRange(min=0, max=999)),
+                ]
+            )
+        },
+    )
+    df = pl.DataFrame({"amount": [10, 20], "status": ["a", "b"]})
+    executor = _make_executor(df, "orders")
+    cols = dd.get_table_schema("orders", executor, categorical_threshold=10)
+    col_map = {c.name: c for c in cols}
+    assert col_map["amount"].min_val == 0  # from data_dict
+    assert col_map["amount"].max_val == 999
+    assert "status" in col_map            # from SQL fallback
+
+
+def test_to_prompt_dict_excludes_column_specs() -> None:
+    dd = DataDict(
+        name="sales",
+        tables={
+            "orders": TableSpec(
+                description="Order records.",
+                columns=[ColumnSpec(name="amount", range=ColumnRange(min=0, max=100))],
+            )
+        },
+    )
+    d = dd.to_prompt_dict()
+    assert "columns" not in (d.get("tables", {}).get("orders") or {})
+
+
+def test_to_prompt_dict_includes_table_description() -> None:
+    dd = DataDict(tables={"orders": TableSpec(description="Order records.")})
+    d = dd.to_prompt_dict()
+    assert d["tables"]["orders"]["description"] == "Order records."
+
+
+def test_to_prompt_dict_table_with_no_description_is_null() -> None:
+    dd = DataDict(tables={"orders": TableSpec()})
+    d = dd.to_prompt_dict()
+    assert d["tables"]["orders"] is None
+
+
+def test_to_prompt_dict_excludes_none_name() -> None:
+    dd = DataDict()
+    d = dd.to_prompt_dict()
+    assert "name" not in d
+
+
+def test_to_prompt_dict_excludes_none_description() -> None:
+    dd = DataDict(name="sales")
+    d = dd.to_prompt_dict()
+    assert "description" not in d
+
+
+def test_to_prompt_dict_includes_relationships() -> None:
+    from querychat._data_dict import RelationshipSpec
+
+    dd = DataDict(
+        relationships=[RelationshipSpec(join="a.id = b.id", cardinality="one-to-many")]
+    )
+    d = dd.to_prompt_dict()
+    assert d["relationships"][0]["join"] == "a.id = b.id"
+    assert d["relationships"][0]["cardinality"] == "one-to-many"
+
+
+def test_to_prompt_dict_includes_glossary() -> None:
+    dd = DataDict(glossary={"ARR": "Annual Recurring Revenue"})
+    d = dd.to_prompt_dict()
+    assert d["glossary"]["ARR"] == "Annual Recurring Revenue"
diff --git a/pkg-py/tests/test_datasource.py b/pkg-py/tests/test_datasource.py
index 913d9a424..7ae30b4e3 100644
--- a/pkg-py/tests/test_datasource.py
+++ b/pkg-py/tests/test_datasource.py
@@ -5,7 +5,12 @@
 import narwhals.stable.v1 as nw
 import pandas as pd
 import pytest
-from querychat._datasource import DataFrameSource, SQLAlchemySource
+from querychat._datasource import (
+    ColumnMeta,
+    DataFrameSource,
+    SQLAlchemySource,
+    format_schema,
+)
 from querychat._utils import UnsafeQueryError, check_query
 from querychat.types import MissingColumnsError
 from sqlalchemy import create_engine, text
@@ -503,3 +508,61 @@ def test_check_query_escape_hatch_accepts_various_values(monkeypatch):
     for value in ["true", "TRUE", "1", "yes", "YES"]:
         monkeypatch.setenv("QUERYCHAT_ENABLE_UPDATE_QUERIES", value)
         check_query("INSERT INTO table VALUES (1)")  # Should not raise
+
+
+# -- ColumnMeta.description and format_schema tests --
+
+
+@pytest.fixture
+def sample_df():
+    """Create a sample pandas DataFrame for testing."""
+    return pd.DataFrame(
+        {
+            "id": [1, 2, 3],
+            "name": ["Alice", "Bob", "Charlie"],
+            "age": [25, 30, 35],
+            "salary": [50000.0, 60000.0, 70000.0],
+        }
+    )
+
+
+def test_column_meta_has_description_field() -> None:
+    meta = ColumnMeta(name="x", sql_type="TEXT", kind="text")
+    assert meta.description is None
+    meta2 = ColumnMeta(name="x", sql_type="TEXT", kind="text", description="A column")
+    assert meta2.description == "A column"
+
+
+def test_format_schema_includes_description() -> None:
+    cols = [
+        ColumnMeta(name="id", sql_type="INTEGER", kind="numeric", description="Primary key"),
+        ColumnMeta(name="name", sql_type="TEXT", kind="text"),
+    ]
+    result = format_schema("mytable", cols)
+    assert "Description: Primary key" in result
+    assert "name" in result
+
+
+def test_dataframe_source_get_column_metas(sample_df) -> None:
+    source = DataFrameSource(nw.from_native(sample_df), "test")
+    metas = source.get_column_metas()
+    assert len(metas) > 0
+    assert all(isinstance(m, ColumnMeta) for m in metas)
+    # Stats should NOT be populated yet
+    assert all(m.min_val is None for m in metas if m.kind == "numeric")
+
+
+def test_dataframe_source_populate_column_stats(sample_df) -> None:
+    source = DataFrameSource(nw.from_native(sample_df), "test")
+    metas = source.get_column_metas()
+    source.populate_column_stats(metas, categorical_threshold=10)
+    numeric_metas = [m for m in metas if m.kind == "numeric"]
+    if numeric_metas:
+        assert numeric_metas[0].min_val is not None
+
+
+def test_dataframe_source_get_schema_unchanged(sample_df) -> None:
+    source = DataFrameSource(nw.from_native(sample_df), "test")
+    schema = source.get_schema(categorical_threshold=10)
+    assert "Table: test" in schema
+    assert "Columns:" in schema
diff --git a/pkg-py/tests/test_deferred_client.py b/pkg-py/tests/test_deferred_client.py
index bdd2f6aa0..cd3d6f022 100644
--- a/pkg-py/tests/test_deferred_client.py
+++ b/pkg-py/tests/test_deferred_client.py
@@ -2,7 +2,7 @@
 
 import pandas as pd
 import pytest
-from chatlas import ChatOpenAI
+from chatlas import ChatOpenAI, Turn
 from querychat._querychat_base import QueryChatBase
 
 
@@ -55,21 +55,21 @@ def test_client_method_requires_data_source(self):
         """client() should raise if data_source is not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.client()
 
     def test_console_requires_data_source(self):
         """console() should raise if data_source is not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.console()
 
     def test_generate_greeting_requires_data_source(self):
         """generate_greeting() should raise if data_source is not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.generate_greeting()
 
 
@@ -81,10 +81,10 @@ def test_deferred_data_source_uses_default_client(self, sample_df, monkeypatch):
         monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
 
         qc = QueryChatBase(None, "users")
-        assert qc.data_source is None
+        assert len(qc.table_names()) == 0
         assert qc._client_spec is None
 
-        qc.data_source = sample_df
+        qc.add_table(sample_df, "users")
 
         client = qc.client()
         assert client is not None
@@ -95,7 +95,7 @@ def test_deferred_explicit_client_at_init_then_data_source(self, sample_df, monk
         monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
 
         qc = QueryChatBase(None, "users", client="openai")
-        qc.data_source = sample_df
+        qc.add_table(sample_df, "users")
 
         client = qc.client()
         assert client is not None
@@ -111,7 +111,7 @@ def test_no_openai_key_error_when_deferred(self, monkeypatch):
     def test_invalid_explicit_client_raises_when_client_is_resolved(self, sample_df):
         """Invalid explicit client specs should fail when a live client is requested."""
         qc = QueryChatBase(None, "users", client="not_a_real_provider_xyz123")
-        qc.data_source = sample_df
+        qc.add_table(sample_df, "users")
 
         with pytest.raises(ValueError, match="is not a known chatlas provider"):
             qc.client()
@@ -125,7 +125,7 @@ def test_immediate_pattern_unchanged(self, sample_df, monkeypatch):
         monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
         qc = QueryChatBase(sample_df, "test_table")
 
-        assert qc.data_source is not None
+        assert len(qc.table_names()) > 0
         # _client_spec is None (will use env default at resolution time)
         assert qc._client_spec is None
 
@@ -134,3 +134,40 @@ def test_immediate_pattern_unchanged(self, sample_df, monkeypatch):
 
         prompt = qc.system_prompt
         assert "test_table" in prompt
+
+
+@pytest.fixture
+def other_df():
+    return pd.DataFrame({"order_id": [1, 2], "amount": [100, 200]})
+
+
+class TestPromptRebuildWarning:
+    """Warns when system prompt is rebuilt after a client already has chat history."""
+
+    def test_warns_when_client_spec_has_history(self, sample_df, monkeypatch):
+        monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
+        chat = ChatOpenAI()
+        chat.set_turns([Turn(role="user", contents=["hello"])])
+
+        qc = QueryChatBase(None, "users", client=chat)
+
+        with pytest.warns(UserWarning, match="chat history"):
+            qc.add_table(sample_df, "users")
+
+    def test_warns_when_console_client_has_history(self, sample_df, other_df, monkeypatch):
+        monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
+        qc = QueryChatBase(sample_df, "users")
+
+        console_chat = ChatOpenAI()
+        console_chat.set_turns([Turn(role="user", contents=["hello"])])
+        qc._client_console = console_chat
+
+        with pytest.warns(UserWarning, match="chat history"):
+            qc.add_table(other_df, "orders")
+
+    def test_no_warning_without_history(self, sample_df, other_df, recwarn, monkeypatch):
+        monkeypatch.setenv("OPENAI_API_KEY", "sk-dummy-key-for-testing")
+        qc = QueryChatBase(sample_df, "users")
+        qc.add_table(other_df, "orders")
+        chat_history_warnings = [w for w in recwarn.list if "chat history" in str(w.message)]
+        assert len(chat_history_warnings) == 0
diff --git a/pkg-py/tests/test_deferred_datasource.py b/pkg-py/tests/test_deferred_datasource.py
index 522c98ec9..f5a2e611a 100644
--- a/pkg-py/tests/test_deferred_datasource.py
+++ b/pkg-py/tests/test_deferred_datasource.py
@@ -1,4 +1,4 @@
-"""Tests for deferred data source initialization."""
+"""Tests for deferred data source patterns using add_table()."""
 
 import os
 
@@ -9,7 +9,6 @@
 
 @pytest.fixture(autouse=True)
 def set_dummy_api_key():
-    """Set a dummy OpenAI API key for testing."""
     old_api_key = os.environ.get("OPENAI_API_KEY")
     os.environ["OPENAI_API_KEY"] = "sk-dummy-api-key-for-testing"
     yield
@@ -21,112 +20,104 @@ def set_dummy_api_key():
 
 @pytest.fixture
 def sample_df():
-    """Create a sample pandas DataFrame for testing."""
     return pd.DataFrame(
         {
             "id": [1, 2, 3],
             "name": ["Alice", "Bob", "Charlie"],
             "age": [25, 30, 35],
-        },
+        }
     )
 
 
-class TestDeferredDataSourceInit:
-    """Tests for initializing QueryChatBase with None data_source."""
+class TestAddTableDeferred:
+    """Tests for deferred data source using add_table()."""
 
-    def test_init_with_none_data_source(self):
-        """QueryChatBase should accept None data_source with table_name."""
+    def test_add_table_after_deferred_init(self, sample_df):
+        """add_table should work after deferred __init__(None)."""
         qc = QueryChatBase(None, "users")
-        assert qc._data_source is None
-        assert qc._table_name == "users"
+        qc.add_table(sample_df, "users")
 
-    def test_init_with_none_requires_table_name(self):
-        """QueryChatBase with None data_source must have explicit table_name."""
-        # This should work - table_name is explicitly provided
-        qc = QueryChatBase(None, "users")
-        assert qc._table_name == "users"
-
-
-class TestDataSourceProperty:
-    """Tests for the data_source property setter."""
-
-    def test_data_source_setter(self, sample_df):
-        """Setting data_source should normalize and build system prompt."""
-        qc = QueryChatBase(None, "users")
-        qc.data_source = sample_df
-
-        assert qc._data_source is not None
-        assert qc._data_source.table_name == "users"
-        # System prompt should now be built
+        assert "users" in qc.table_names()
+        assert qc._data_sources["users"].table_name == "users"
         assert "users" in qc.system_prompt
 
-    def test_data_source_can_be_changed(self, sample_df):
-        """data_source can be changed after initial set."""
+    def test_add_table_replace(self, sample_df):
+        """add_table(replace=True) should replace an existing table."""
         qc = QueryChatBase(sample_df, "original")
 
         new_df = pd.DataFrame({"x": [1, 2], "y": [3, 4]})
-        qc.data_source = new_df
+        qc.add_table(new_df, "original", replace=True)
 
-        # Should have new data source with original table_name
-        assert qc._data_source is not None
-        # System prompt should be rebuilt
+        assert "original" in qc.table_names()
         assert "original" in qc.system_prompt
 
-    def test_data_source_getter_returns_none_when_not_set(self):
-        """data_source property returns None when not set."""
+    def test_no_tables_when_deferred(self):
+        """table_names() should return empty list when deferred."""
         qc = QueryChatBase(None, "users")
-        assert qc.data_source is None
+        assert qc.table_names() == []
 
 
 class TestMethodRequirements:
-    """Tests that methods properly require data_source to be set."""
+    """Tests that methods properly require at least one data source."""
 
     def test_client_requires_data_source(self):
-        """client() should raise if data_source not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.client()
 
     def test_console_requires_data_source(self):
-        """console() should raise if data_source not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.console()
 
     def test_generate_greeting_requires_data_source(self):
-        """generate_greeting() should raise if data_source not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.generate_greeting()
 
     def test_system_prompt_requires_data_source(self):
-        """system_prompt property should raise if data_source not set."""
         qc = QueryChatBase(None, "users")
 
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             _ = qc.system_prompt
 
-    def test_cleanup_safe_when_data_source_not_set(self):
-        """cleanup() should not raise when data_source is None."""
+    def test_cleanup_safe_when_no_data_sources(self):
         qc = QueryChatBase(None, "users")
-        # Should not raise
         qc.cleanup()
 
 
+class TestNoArgConstruction:
+    """Tests for QueryChatBase() with no positional arguments."""
+
+    def test_init_no_args(self):
+        qc = QueryChatBase()
+        assert qc.table_names() == []
+
+    def test_init_no_args_then_add_table(self, sample_df):
+        qc = QueryChatBase()
+        qc.add_table(sample_df, "test_table")
+        assert qc.table_names() == ["test_table"]
+
+    def test_init_no_args_then_add_multiple_tables(self, sample_df):
+        df2 = pd.DataFrame({"x": [1, 2], "y": [3, 4]})
+        qc = QueryChatBase()
+        qc.add_table(sample_df, "users")
+        qc.add_table(df2, "extra")
+        assert qc.table_names() == ["users", "extra"]
+
+
 class TestBackwardCompatibility:
     """Tests that existing patterns continue to work."""
 
     def test_immediate_pattern_unchanged(self, sample_df):
-        """Existing code with data_source continues to work."""
         qc = QueryChatBase(sample_df, "test_table")
 
-        assert qc.data_source is not None
-        assert qc.data_source.table_name == "test_table"
+        assert len(qc.table_names()) > 0
+        assert qc._data_sources["test_table"].table_name == "test_table"
 
-        # All methods should work immediately
         client = qc.client()
         assert client is not None
 
@@ -137,28 +128,23 @@ def test_immediate_pattern_unchanged(self, sample_df):
 class TestDeferredPatternIntegration:
     """Integration tests for the full deferred pattern workflow."""
 
-    def test_deferred_then_set_property(self, sample_df):
-        """Test setting data_source via property after init."""
+    def test_deferred_then_add_table(self, sample_df):
         qc = QueryChatBase(None, "users")
-        assert qc.data_source is None
+        assert len(qc.table_names()) == 0
         assert qc._client_spec is None
 
-        qc.data_source = sample_df
-        assert qc.data_source is not None
+        qc.add_table(sample_df, "users")
+        assert len(qc.table_names()) > 0
 
         client = qc.client()
         assert client is not None
         assert "users" in qc.system_prompt
 
-    def test_data_source_change_rebuilds_prompt(self, sample_df):
-        """Test that changing data_source rebuilds system prompt."""
+    def test_replace_table_rebuilds_prompt(self, sample_df):
         qc = QueryChatBase(sample_df, "original")
-        original_prompt = qc.system_prompt
 
         new_df = pd.DataFrame({"different": [1, 2], "columns": [3, 4]})
-        qc.data_source = new_df
+        qc.add_table(new_df, "original", replace=True)
 
         new_prompt = qc.system_prompt
-
-        assert original_prompt != new_prompt
         assert "original" in new_prompt
diff --git a/pkg-py/tests/test_deferred_shiny.py b/pkg-py/tests/test_deferred_shiny.py
index 96ba29656..f239661ac 100644
--- a/pkg-py/tests/test_deferred_shiny.py
+++ b/pkg-py/tests/test_deferred_shiny.py
@@ -1,6 +1,7 @@
 """Tests for deferred data source in Shiny QueryChat."""
 
 import os
+from unittest.mock import MagicMock
 
 import chatlas
 import pandas as pd
@@ -9,6 +10,7 @@
 from querychat import QueryChat
 from querychat._querychat_base import create_client as _create_client
 from querychat.express import QueryChat as ExpressQueryChat
+from shiny._namespaces import Root
 from shiny.express._stub_session import ExpressStubSession
 from shiny.session import session_context
 
@@ -37,35 +39,45 @@ def sample_df():
     )
 
 
+class TestNoArgConstruction:
+    """Tests for QueryChat() with no positional arguments."""
+
+    def test_init_no_args(self):
+        qc = QueryChat()
+        assert qc.table_names() == []
+        assert qc.id == "querychat"
+
+    def test_init_no_args_then_add_table(self, sample_df):
+        qc = QueryChat()
+        qc.add_table(sample_df, "users")
+        assert qc.table_names() == ["users"]
+
+
 class TestShinyDeferredDataSource:
     """Tests for deferred data source in Shiny QueryChat."""
 
     def test_init_with_none(self):
         """Shiny QueryChat should accept None data_source."""
         qc = QueryChat(None, "users")
-        assert qc._data_source is None
-        assert qc._table_name == "users"
-        # ID should use table_name even with None data_source
+        assert len(qc.table_names()) == 0
         assert qc.id == "querychat_users"
 
     def test_ui_works_without_data_source(self):
         """ui() should work without data_source set."""
         qc = QueryChat(None, "users")
-        # Should not raise
         ui = qc.ui()
         assert ui is not None
 
     def test_sidebar_works_without_data_source(self):
         """sidebar() should work without data_source set."""
         qc = QueryChat(None, "users")
-        # Should not raise
         sidebar = qc.sidebar()
         assert sidebar is not None
 
     def test_app_requires_data_source(self):
         """app() should raise if data_source not set."""
         qc = QueryChat(None, "users")
-        with pytest.raises(RuntimeError, match="data_source must be set"):
+        with pytest.raises(RuntimeError, match="At least one data source"):
             qc.app()
 
     def test_express_allows_deferred_data_source_during_stub_session(self):
@@ -82,6 +94,7 @@ def test_server_client_override_does_not_mutate_shared_client_spec(
         init_client = ChatOpenAI(model="gpt-4.1")
         override_client = ChatOpenAI(model="gpt-4.1-mini")
         qc = QueryChat(None, "users", client=init_client)
+        qc.add_table(sample_df, "users")
         recorded_specs = []
         real_create_client = _create_client
 
@@ -94,7 +107,7 @@ def spy_create_client(client_spec):
         )
 
         with session_context(ExpressStubSession()):
-            vals = qc.server(data_source=sample_df, client=override_client)
+            vals = qc.server(client=override_client)
 
         assert isinstance(vals.client, chatlas.Chat)
         assert len(recorded_specs) == 1
@@ -107,11 +120,196 @@ def test_multiple_server_overrides_do_not_leak_into_shared_state(self, sample_df
         first_override = ChatOpenAI(model="gpt-4.1-mini")
         second_override = ChatOpenAI(model="gpt-4.1-nano")
         qc = QueryChat(None, "users", client=init_client)
+        qc.add_table(sample_df, "users")
 
         with session_context(ExpressStubSession()):
-            qc.server(data_source=sample_df, client=first_override)
+            qc.server(client=first_override)
+
+        # Reset server_initialized for sequential test
+        qc._server_initialized = False
 
         with session_context(ExpressStubSession()):
-            qc.server(data_source=sample_df, client=second_override)
+            qc.server(client=second_override)
 
         assert qc._client_spec is init_client
+
+
+class TestExpressMultiTable:
+    """Tests for multi-table support in QueryChatExpress."""
+
+    @pytest.fixture
+    def orders_df(self):
+        return pd.DataFrame({"id": [1, 2], "amount": [100.0, 200.0]})
+
+    @pytest.fixture
+    def customers_df(self):
+        return pd.DataFrame({"id": [101, 102], "name": ["Alice", "Bob"]})
+
+    def test_add_table_does_not_raise_after_init_stub_session(
+        self, orders_df, customers_df
+    ):
+        """add_table() must succeed after __init__ during stub session."""
+        with session_context(ExpressStubSession()):
+            qc = ExpressQueryChat(orders_df, "orders")
+            # Regression guard: if __init__ set _server_initialized during the
+            # stub session, this add_table() call would raise RuntimeError.
+            qc.add_table(customers_df, "customers")
+
+        assert qc.table_names() == ["orders", "customers"]
+
+    def test_server_not_initialized_after_init_stub_session(self, orders_df):
+        """_server_initialized must remain False after __init__ in stub session."""
+        with session_context(ExpressStubSession()):
+            qc = ExpressQueryChat(orders_df, "orders")
+            assert not qc._server_initialized
+
+    def test_ensure_server_started_noop_during_stub_session(
+        self, orders_df, monkeypatch
+    ):
+        """_ensure_server_started() must be a no-op during the stub session."""
+        called = []
+
+        def spy_mod_server(*args, **kwargs):
+            called.append(True)
+
+        monkeypatch.setattr("querychat._shiny.mod_server", spy_mod_server)
+
+        with session_context(ExpressStubSession()):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc._ensure_server_started()
+
+        assert not called, "mod_server should not be called during stub session"
+
+    def test_ensure_server_started_starts_server_in_real_session(
+        self, orders_df, monkeypatch
+    ):
+        """_ensure_server_started() starts the server exactly once in a real session."""
+        called = []
+
+        def fake_mod_server(*args, **kwargs):
+            called.append((args, kwargs))
+            return MagicMock()
+
+        monkeypatch.setattr("querychat._shiny.mod_server", fake_mod_server)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            assert not qc._server_initialized
+            qc._ensure_server_started()
+
+        assert len(called) == 1
+        assert qc._server_initialized
+
+    def test_ensure_server_started_idempotent(self, orders_df, monkeypatch):
+        """_ensure_server_started() called twice starts server only once."""
+        called = []
+
+        def fake_mod_server(*args, **kwargs):
+            called.append(True)
+            return MagicMock()
+
+        monkeypatch.setattr("querychat._shiny.mod_server", fake_mod_server)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc._ensure_server_started()
+            qc._ensure_server_started()
+
+        assert len(called) == 1
+
+    def test_add_table_after_init_then_server_started_in_real_session(
+        self, orders_df, customers_df, monkeypatch
+    ):
+        """Full Express multi-table flow: init → add_table → ensure_server_started."""
+        started_with_sources: list[list[str]] = []
+
+        def fake_mod_server(*args, **kwargs):
+            started_with_sources.append(list(kwargs["data_sources"].keys()))
+            return MagicMock()
+
+        monkeypatch.setattr("querychat._shiny.mod_server", fake_mod_server)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc.add_table(customers_df, "customers")
+            qc._ensure_server_started()
+
+        assert started_with_sources == [["orders", "customers"]]
+
+    def test_table_delegates_to_vals(self, orders_df, customers_df, monkeypatch):
+        """table() should delegate to _vals.table() and return its result."""
+        fake_accessor = MagicMock()
+        fake_vals = MagicMock()
+        fake_vals.table.return_value = fake_accessor
+
+        monkeypatch.setattr("querychat._shiny.mod_server", lambda *a, **kw: fake_vals)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc.add_table(customers_df, "customers")
+            result = qc.table("orders")
+
+        fake_vals.table.assert_called_once_with("orders")
+        assert result is fake_accessor
+
+    def test_table_unknown_name_propagates_error(
+        self, orders_df, customers_df, monkeypatch
+    ):
+        """table() with an unknown name should propagate ValueError from ServerValues."""
+        fake_vals = MagicMock()
+        fake_vals.table.side_effect = ValueError("'foo' not found")
+
+        monkeypatch.setattr("querychat._shiny.mod_server", lambda *a, **kw: fake_vals)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc.add_table(customers_df, "customers")
+            with pytest.raises(ValueError, match="not found"):
+                qc.table("foo")
+
+    def test_current_table_delegates_to_vals(
+        self, orders_df, customers_df, monkeypatch
+    ):
+        """current_table() should delegate to _vals.current_table()."""
+        fake_vals = MagicMock()
+        fake_vals.current_table.return_value = "customers"
+
+        monkeypatch.setattr("querychat._shiny.mod_server", lambda *a, **kw: fake_vals)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc.add_table(customers_df, "customers")
+            result = qc.current_table()
+
+        fake_vals.current_table.assert_called_once()
+        assert result == "customers"
+
+    def test_current_table_returns_none_before_any_query(
+        self, orders_df, customers_df, monkeypatch
+    ):
+        """current_table() returns None when no query has been run yet."""
+        fake_vals = MagicMock()
+        fake_vals.current_table.return_value = None
+
+        monkeypatch.setattr("querychat._shiny.mod_server", lambda *a, **kw: fake_vals)
+
+        mock_session = MagicMock()
+        mock_session.ns = Root
+        with session_context(mock_session):
+            qc = ExpressQueryChat(orders_df, "orders")
+            qc.add_table(customers_df, "customers")
+            result = qc.current_table()
+
+        assert result is None
diff --git a/pkg-py/tests/test_frameworks.py b/pkg-py/tests/test_frameworks.py
index 52e41ea47..1b554657b 100644
--- a/pkg-py/tests/test_frameworks.py
+++ b/pkg-py/tests/test_frameworks.py
@@ -37,7 +37,7 @@ def test_instantiation(self, sample_df):
 
         qc = QueryChat(sample_df, "tips")
         assert qc is not None
-        assert qc.data_source is not None
+        assert len(qc.table_names()) > 0
 
     def test_app_returns_blocks(self, sample_df):
         from querychat.gradio import QueryChat
@@ -56,6 +56,35 @@ def test_ui_returns_state(self, sample_df):
             result = qc.ui()
         assert isinstance(result, gr.State)
 
+    def test_app_uses_active_table_for_fallback_sql_display(self):
+        import pandas as pd
+        from querychat.gradio import QueryChat
+
+        qc = QueryChat(pd.DataFrame({"id": [1, 2], "amount": [10, 20]}), "orders")
+        qc.add_table(pd.DataFrame({"id": [101, 102], "state": ["CA", "NY"]}), "customers")
+
+        app = qc.app()._blocks
+        update_displays = next(
+            block_fn.fn
+            for block_fn in app.fns.values()
+            if getattr(block_fn.fn, "__name__", "") == "update_displays"
+        )
+
+        _, sql_code, native_df, data_info_text = update_displays(
+            {
+                "table": "customers",
+                "sql": None,
+                "title": None,
+                "error": "Query syntax error: missing column",
+                "turns": [],
+            }
+        )
+
+        assert sql_code == "SELECT * FROM customers"
+        assert native_df["id"].tolist() == [101, 102]
+        assert native_df["state"].tolist() == ["CA", "NY"]
+        assert "⚠️ Query syntax error: missing column" in data_info_text
+
 
 class TestDashQueryChat:
     @pytest.fixture(autouse=True)
@@ -72,7 +101,7 @@ def test_instantiation(self, sample_df):
 
         qc = QueryChat(sample_df, "tips")
         assert qc is not None
-        assert qc.data_source is not None
+        assert len(qc.table_names()) > 0
 
     def test_app_returns_dash_app(self, sample_df):
         from querychat.dash import QueryChat
@@ -154,7 +183,7 @@ def test_instantiation(self, sample_df):
 
         qc = QueryChat(sample_df, "tips")
         assert qc is not None
-        assert qc.data_source is not None
+        assert len(qc.table_names()) > 0
 
     def test_system_prompt_generated(self, sample_df):
         from querychat.streamlit import QueryChat
@@ -191,6 +220,6 @@ def test_data_source_accessible(self, sample_df):
         from querychat.streamlit import QueryChat
 
         qc = QueryChat(sample_df, "tips")
-        ds = qc.data_source
+        ds = qc.table("tips").data_source
         assert ds is not None
         assert ds.table_name == "tips"
diff --git a/pkg-py/tests/test_multi_table.py b/pkg-py/tests/test_multi_table.py
new file mode 100644
index 000000000..7e634c52c
--- /dev/null
+++ b/pkg-py/tests/test_multi_table.py
@@ -0,0 +1,1081 @@
+"""Tests for multi-table support."""
+
+import os
+import tempfile
+from pathlib import Path
+from unittest.mock import patch
+
+import pandas as pd
+import polars as pl
+import pytest
+from querychat import QueryChat
+from querychat._datasource import DataFrameSource
+from querychat._query_executor import (
+    DataSourceExecutor,
+    DuckDBExecutor,
+    check_source_compatibility,
+)
+from querychat._querychat_base import QueryChatBase, normalize_data_source
+from sqlalchemy import create_engine, text
+
+
+@pytest.fixture(autouse=True)
+def set_dummy_api_key():
+    """Set a dummy OpenAI API key for testing."""
+    old_api_key = os.environ.get("OPENAI_API_KEY")
+    os.environ["OPENAI_API_KEY"] = "sk-dummy-api-key-for-testing"
+    yield
+    if old_api_key is not None:
+        os.environ["OPENAI_API_KEY"] = old_api_key
+    else:
+        del os.environ["OPENAI_API_KEY"]
+
+
+@pytest.fixture
+def orders_df():
+    """Sample orders DataFrame."""
+    return pd.DataFrame(
+        {
+            "id": [1, 2, 3],
+            "customer_id": [101, 102, 101],
+            "amount": [100.0, 200.0, 150.0],
+        }
+    )
+
+
+@pytest.fixture
+def customers_df():
+    """Sample customers DataFrame."""
+    return pd.DataFrame(
+        {
+            "id": [101, 102, 103],
+            "name": ["Alice", "Bob", "Charlie"],
+            "state": ["CA", "NY", "CA"],
+        }
+    )
+
+
+@pytest.fixture
+def shared_sqlite_engine():
+    """SQLite engine with orders/customers tables; always disposed and deleted."""
+    temp_db = tempfile.NamedTemporaryFile(delete=False, suffix=".db")  # noqa: SIM115
+    temp_db.close()
+    engine = create_engine(f"sqlite:///{temp_db.name}")
+    try:  # teardown below must also run when table setup itself fails
+        with engine.begin() as conn:
+            conn.execute(text("""
+                CREATE TABLE orders (
+                    id INTEGER,
+                    customer_id INTEGER,
+                    amount REAL
+                )
+            """))
+            conn.execute(text("""
+                CREATE TABLE customers (
+                    id INTEGER,
+                    name TEXT
+                )
+            """))
+            conn.execute(
+                text("""
+                    INSERT INTO orders (id, customer_id, amount)
+                    VALUES
+                        (1, 101, 100.0),
+                        (2, 102, 200.0)
+                """)
+            )
+            conn.execute(
+                text("""
+                    INSERT INTO customers (id, name)
+                    VALUES
+                        (101, 'Alice'),
+                        (102, 'Bob')
+                """)
+            )
+
+        yield engine
+    finally:
+        engine.dispose()
+        Path(temp_db.name).unlink()
+
+
+@pytest.fixture
+def ibis_tables():
+    """Ibis tables with shared backend for compatibility tests."""
+    ibis = pytest.importorskip("ibis")
+    conn = ibis.duckdb.connect()
+    conn.create_table(
+        "orders",
+        {
+            "id": [1, 2],
+            "customer_id": [101, 102],
+            "amount": [100.0, 200.0],
+        },
+    )
+    conn.create_table(
+        "customers",
+        {
+            "id": [101, 102],
+            "name": ["Alice", "Bob"],
+        },
+    )
+
+    yield {
+        "orders": conn.table("orders"),
+        "customers": conn.table("customers"),
+    }
+
+    conn.disconnect()
+
+
+@pytest.fixture
+def other_ibis_orders_table():
+    """Ibis orders table backed by a different backend instance."""
+    ibis = pytest.importorskip("ibis")
+    conn = ibis.duckdb.connect()
+    conn.create_table(
+        "orders",
+        {
+            "id": [1, 2],
+            "customer_id": [101, 102],
+            "amount": [100.0, 200.0],
+        },
+    )
+
+    yield conn.table("orders")
+
+    conn.disconnect()
+
+
+class TestNoArgConstruction:
+    """Tests for QueryChatBase() constructed with no positional arguments."""
+
+    def test_no_arg_construction(self):
+        qc = QueryChatBase()
+        assert qc.table_names() == []
+
+    def test_no_arg_construction_multi_table(self, orders_df, customers_df):
+        qc = QueryChatBase()
+        qc.add_table(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+        assert qc.table_names() == ["orders", "customers"]
+
+
+class TestMultiSourceStorage:
+    """Tests for multi-source storage infrastructure."""
+
+    def test_single_table_stored_in_data_sources(self, orders_df):
+        """Test that single table is stored in _data_sources dict."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        # Should have _data_sources dict with one entry
+        assert hasattr(qc, "_data_sources")
+        assert isinstance(qc._data_sources, dict)
+        assert "orders" in qc._data_sources
+        assert len(qc._data_sources) == 1
+
+    def test_table_names_returns_list(self, orders_df):
+        """Test that table_names() returns list of table names."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        names = qc.table_names()
+
+        assert names == ["orders"]
+
+
+class TestAddTable:
+    """Tests for add_table() method."""
+
+    def test_add_table_basic(self, orders_df, customers_df):
+        """Test adding a second table."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+
+        assert qc.table_names() == ["orders", "customers"]
+        assert len(qc._data_sources) == 2
+
+    def test_add_table_duplicate_name_raises(self, orders_df):
+        """Test that adding duplicate table name raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        with pytest.raises(ValueError, match="Table 'orders' already exists"):
+            qc.add_table(orders_df, "orders")
+
+    def test_add_table_invalid_name_raises(self, orders_df, customers_df):
+        """Test that invalid table name raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        with pytest.raises(ValueError, match="must begin with a letter"):
+            qc.add_table(customers_df, "123invalid")
+
+    def test_add_table_after_server_raises(self, orders_df, customers_df):
+        """Test that adding table after server init raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc._server_initialized = True  # Simulate server initialization
+
+        with pytest.raises(RuntimeError, match="Cannot add tables after server"):
+            qc.add_table(customers_df, "customers")
+
+
+class TestRemoveTable:
+    """Tests for remove_table() method."""
+
+    def test_remove_table_basic(self, orders_df, customers_df):
+        """Test removing a table."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+
+        qc.remove_table("customers")
+
+        assert qc.table_names() == ["orders"]
+
+    def test_remove_table_nonexistent_raises(self, orders_df):
+        """Test that removing nonexistent table raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        with pytest.raises(ValueError, match="Table 'foo' not found"):
+            qc.remove_table("foo")
+
+    def test_remove_last_table_raises(self, orders_df):
+        """Test that removing last table raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+
+        with pytest.raises(ValueError, match="Cannot remove last table"):
+            qc.remove_table("orders")
+
+    def test_remove_table_after_server_raises(self, orders_df, customers_df):
+        """Test that removing table after server init raises error."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+        qc._server_initialized = True
+
+        with pytest.raises(RuntimeError, match="Cannot remove tables after server"):
+            qc.remove_table("customers")
+
+
+class TestTableAccessor:
+    """Tests for table() method and TableAccessor class."""
+    # NOTE(review): this class currently defines no test methods.
+
+
+class TestMultiTableSystemPrompt:
+    """Tests for multi-table system prompt generation."""
+
+    def test_multiple_schemas_in_prompt(self, orders_df, customers_df):
+        """Test that multiple table schemas appear in prompt."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+
+        prompt = qc.system_prompt
+
+        assert "orders" in prompt
+        assert "customers" in prompt
+
+    def test_system_prompt_references_get_schema_tool(self, orders_df, customers_df):
+        """Column details are now behind get_schema; prompt lists table names only."""
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+
+        prompt = qc.system_prompt
+
+        # Table names still appear in the prompt
+        assert "orders" in prompt
+        assert "customers" in prompt
+        # The prompt must name the schema tool that now serves column details
+        assert "querychat_get_schema" in prompt
+
+
+class TestMultiTableCleanup:
+    """Tests for cleanup of multiple data sources."""
+
+    def test_cleanup_all_sources(self, orders_df, customers_df):
+        """Test that cleanup() closes the connection of every data source."""
+        import duckdb
+
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+        sources = list(qc._data_sources.values())  # keep refs; cleanup may drop them
+        assert all(source._conn is not None for source in sources)
+
+        qc.cleanup()
+        for source in sources:  # a closed DuckDB connection rejects any query
+            with pytest.raises(duckdb.ConnectionException):
+                source.execute_query("SELECT 1")
+
+
+@pytest.fixture
+def orders_qc(orders_df):
+    """QueryChat with a single orders table."""
+    return QueryChat(orders_df, "orders", greeting="Hello!")
+
+
+class TestSourceCompatibility:
+    def test_same_pandas_compatible(self, orders_qc, customers_df):
+        """Two pandas DataFrameSources are compatible."""
+        first = orders_qc._data_sources["orders"]
+        second = normalize_data_source(customers_df, "customers")
+        # Should not raise
+        check_source_compatibility({"orders": first}, second, "customers")
+
+    def test_mixed_pandas_polars_incompatible(self, orders_qc):
+        """Pandas and Polars DataFrameSources are incompatible."""
+        first = orders_qc._data_sources["orders"]
+        polars_df = pl.DataFrame({"x": [1, 2]})
+        second = normalize_data_source(polars_df, "other")
+        with pytest.raises(ValueError, match="same DataFrame backend"):
+            check_source_compatibility({"orders": first}, second, "other")
+
+    def test_different_source_types_incompatible(self, orders_qc):
+        """DataFrameSource and PolarsLazySource are incompatible."""
+        first = orders_qc._data_sources["orders"]
+        lf = pl.LazyFrame({"x": [1, 2]})
+        second = normalize_data_source(lf, "lazy_table")
+        with pytest.raises(ValueError, match="same type"):
+            check_source_compatibility({"orders": first}, second, "lazy_table")
+
+    def test_add_table_validates_compatibility(self, orders_qc):
+        """add_table should reject incompatible source types."""
+        lf = pl.LazyFrame({"x": [1, 2]})
+        with pytest.raises(ValueError, match="same type"):
+            orders_qc.add_table(lf, "lazy_table")
+
+    def test_shared_sqlalchemy_engine_compatible(self, shared_sqlite_engine):
+        """SQLAlchemy sources sharing an Engine instance are compatible."""
+        first = normalize_data_source(shared_sqlite_engine, "orders")
+        second = normalize_data_source(shared_sqlite_engine, "customers")
+
+        check_source_compatibility({"orders": first}, second, "customers")
+
+    def test_mismatched_sqlalchemy_engines_incompatible(self, shared_sqlite_engine):
+        """SQLAlchemy sources using different Engine instances are incompatible."""
+        temp_db = tempfile.NamedTemporaryFile(delete=False, suffix=".db")  # noqa: SIM115
+        temp_db.close()
+        other_engine = create_engine(f"sqlite:///{temp_db.name}")
+        try:
+            with other_engine.begin() as conn:
+                conn.execute(text("CREATE TABLE customers (id INTEGER, name TEXT)"))
+
+            first = normalize_data_source(shared_sqlite_engine, "orders")
+            second = normalize_data_source(other_engine, "customers")
+
+            with pytest.raises(ValueError, match="share the same Engine instance"):
+                check_source_compatibility({"orders": first}, second, "customers")
+        finally:
+            other_engine.dispose()
+            Path(temp_db.name).unlink()
+
+    def test_shared_ibis_backend_compatible(self, ibis_tables):
+        """Ibis sources sharing a backend instance are compatible."""
+        first = normalize_data_source(ibis_tables["orders"], "orders")
+        second = normalize_data_source(ibis_tables["customers"], "customers")
+
+        check_source_compatibility({"orders": first}, second, "customers")
+
+    def test_mismatched_ibis_backends_incompatible(
+        self, ibis_tables, other_ibis_orders_table
+    ):
+        """Ibis sources using different backend instances are incompatible."""
+        first = normalize_data_source(ibis_tables["orders"], "orders")
+        second = normalize_data_source(other_ibis_orders_table, "customers")
+
+        with pytest.raises(ValueError, match="share the same backend instance"):
+            check_source_compatibility({"orders": first}, second, "customers")
+
+    def test_add_table_replace_validates_compatibility(
+        self, orders_qc, customers_df
+    ):
+        """Replacing a table must still respect multi-table compatibility."""
+        orders_qc.add_table(customers_df, "customers")
+        original_orders = orders_qc._data_sources["orders"]
+
+        with pytest.raises(ValueError, match="same DataFrame backend"):
+            orders_qc.add_table(
+                pl.DataFrame(
+                    {
+                        "id": [1, 2],
+                        "customer_id": [101, 102],
+                        "amount": [100.0, 200.0],
+                    }
+                ),
+                "orders",
+                replace=True,
+            )
+
+        assert orders_qc._data_sources["orders"] is original_orders
+        assert isinstance(orders_qc._data_sources["orders"].get_data(), pd.DataFrame)
+
+
+class TestBuildQueryExecutor:
+    def test_executor_none_before_first_use(self, orders_qc):
+        assert orders_qc._query_executor is None
+
+    def test_single_table_uses_data_source_executor(self, orders_qc):
+        assert isinstance(orders_qc._require_query_executor("test"), DataSourceExecutor)
+
+    def test_multi_dataframe_uses_duckdb_executor(self, orders_qc, customers_df):
+        orders_qc.add_table(customers_df, "customers")
+        assert isinstance(orders_qc._require_query_executor("test"), DuckDBExecutor)
+
+    def test_executor_invalidated_on_add_table(self, orders_qc, customers_df):
+        orders_qc._require_query_executor("test")  # build it
+        orders_qc.add_table(customers_df, "customers")
+        assert orders_qc._query_executor is None
+
+    def test_executor_invalidated_on_remove_table(self, orders_qc, customers_df):
+        orders_qc.add_table(customers_df, "customers")
+        orders_qc._require_query_executor("test")  # build it
+        orders_qc.remove_table("customers")
+        assert orders_qc._query_executor is None
+
+    def test_executor_cached_after_build(self, orders_qc):
+        first = orders_qc._require_query_executor("test")
+        second = orders_qc._require_query_executor("test")
+        assert first is second
+
+    def test_cleanup_includes_executor(self, orders_qc, customers_df):
+        orders_qc.add_table(customers_df, "customers")
+        executor = orders_qc._require_query_executor("test")
+        orders_qc.cleanup()
+        # DuckDBExecutor's connection should be closed
+        import duckdb
+
+        with pytest.raises(duckdb.ConnectionException):
+            executor.execute_query("SELECT 1")
+
+    def test_deferred_executor_is_none(self):
+        qc = QueryChatBase(None, "test")
+        assert qc._query_executor is None
+
+    def test_rejects_inconsistent_internal_source_group(self, orders_qc):
+        orders_qc._data_sources["customers"] = normalize_data_source(
+            pl.DataFrame(
+                {
+                    "id": [101, 102],
+                    "name": ["Alice", "Bob"],
+                }
+            ),
+            "customers",
+        )
+
+        with pytest.raises(ValueError, match="same DataFrame backend"):
+            orders_qc._build_query_executor()
+
+    def test_cached_executor_survives_direct_source_mutation(self, orders_qc, customers_df):
+        """Executor built lazily is not invalidated by direct _data_sources mutation."""
+        orders_qc.add_table(customers_df, "customers")
+        built = orders_qc._require_query_executor("test")
+
+        # Directly corrupt _data_sources (bypassing add_table) — executor should
+        # not be affected since invalidation only happens through add/remove_table.
+        orders_qc._data_sources["customers"] = normalize_data_source(
+            pl.DataFrame({"id": [101, 102], "name": ["Alice", "Bob"]}),
+            "customers",
+        )
+
+        assert orders_qc._query_executor is built
+        result = built.execute_query(
+            """
+            SELECT customers.name, orders.amount
+            FROM orders
+            JOIN customers ON orders.customer_id = customers.id
+            WHERE orders.id = 1
+            """
+        )
+        assert result.to_dict("records") == [{"name": "Alice", "amount": 100.0}]
+
+    def test_add_table_failure_cleans_staged_source_and_preserves_state(
+        self, orders_qc, customers_df, monkeypatch
+    ):
+        """A failed add_table cleans up the staged source and leaves the table list as-is."""
+        import duckdb
+
+        names_before = orders_qc.table_names()
+        real_normalize = normalize_data_source
+        staged_source = None
+
+        def capture_staged_source(data_source, table_name):
+            # Keep a handle on whatever source gets normalized during add_table.
+            nonlocal staged_source
+            staged_source = real_normalize(data_source, table_name)
+            return staged_source
+
+        def fail_compat(*a, **kw):
+            raise ValueError("compat check failed")
+
+        monkeypatch.setattr(
+            "querychat._querychat_base.normalize_data_source", capture_staged_source
+        )
+        monkeypatch.setattr(
+            "querychat._querychat_base.check_source_compatibility", fail_compat
+        )
+
+        with pytest.raises(ValueError, match="compat check failed"):
+            orders_qc.add_table(customers_df, "customers")
+
+        assert isinstance(staged_source, DataFrameSource)
+        # Querying the staged source must now fail with a DuckDB connection error.
+        with pytest.raises(duckdb.ConnectionException):
+            staged_source.execute_query("SELECT 1")
+        assert orders_qc.table_names() == names_before
+
+    def test_add_table_replace_failure_cleans_staged_source_and_preserves_state(
+        self, orders_qc, customers_df, monkeypatch
+    ):
+        """A failed replace=True add_table discards the staged source and keeps the original."""
+        import duckdb
+
+        orders_qc.add_table(customers_df, "customers")
+        original_orders_source = orders_qc._data_sources["orders"]
+        names_before = orders_qc.table_names()
+        real_normalize = normalize_data_source
+        staged_source = None
+
+        def capture_staged_source(data_source, table_name):
+            # Keep a handle on whatever source gets normalized during add_table.
+            nonlocal staged_source
+            staged_source = real_normalize(data_source, table_name)
+            return staged_source
+
+        def fail_compat(*a, **kw):
+            raise ValueError("compat check failed")
+
+        # Patch the names as they are looked up in querychat._querychat_base.
+        monkeypatch.setattr(
+            "querychat._querychat_base.normalize_data_source", capture_staged_source
+        )
+        monkeypatch.setattr(
+            "querychat._querychat_base.check_source_compatibility", fail_compat
+        )
+
+        replacement_orders = pd.DataFrame(
+            {
+                "id": [1, 2, 3],
+                "customer_id": [101, 102, 101],
+                "amount": [100.0, 200.0, 150.0],
+            }
+        )
+        with pytest.raises(ValueError, match="compat check failed"):
+            orders_qc.add_table(replacement_orders, "orders", replace=True)
+
+        assert isinstance(staged_source, DataFrameSource)
+        assert staged_source is not original_orders_source
+        # Querying the staged replacement must now fail with a DuckDB connection error.
+        with pytest.raises(duckdb.ConnectionException):
+            staged_source.execute_query("SELECT 1")
+
+        # The registry still holds the original "orders" source and the same table list.
+        assert orders_qc._data_sources["orders"] is original_orders_source
+        assert orders_qc.table_names() == names_before
+
+    def test_remove_table_cleans_up_removed_source(self, orders_qc, customers_df):
+        """remove_table drops the table and leaves its former source unqueryable."""
+        import duckdb
+
+        orders_qc.add_table(customers_df, "customers")
+        removed_source = orders_qc._data_sources["customers"]
+        orders_qc.remove_table("customers")
+
+        assert orders_qc.table_names() == ["orders"]
+        with pytest.raises(duckdb.ConnectionException):
+            removed_source.execute_query("SELECT id FROM customers")
+
+
+class TestMultiTableGuardrails:
+    """Top-level flat accessors warn and delegate to the primary table with multiple tables."""
+
+    def test_shiny_server_values_flat_accessor_warns(self, orders_df, customers_df):
+        import warnings
+
+        from querychat._shiny_module import (
+            ServerValues,
+            TableState,
+            _MultiTableWarnReactive,
+        )
+
+        from shiny import reactive
+
+        orders_sql: reactive.Value[str | None] = reactive.Value(None)
+        orders_title: reactive.Value[str | None] = reactive.Value(None)
+        customers_sql: reactive.Value[str | None] = reactive.Value(None)
+        customers_title: reactive.Value[str | None] = reactive.Value(None)
+
+        table_list = "'orders', 'customers'"
+        vals = ServerValues(
+            df=lambda: orders_df,
+            sql=_MultiTableWarnReactive(orders_sql, "sql", "orders", table_list),  # type: ignore[arg-type]
+            title=_MultiTableWarnReactive(orders_title, "title", "orders", table_list),  # type: ignore[arg-type]
+            tables={
+                "orders": TableState(sql=orders_sql, title=orders_title, df=lambda: orders_df),
+                "customers": TableState(sql=customers_sql, title=customers_title, df=lambda: customers_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={},
+            current_table=reactive.Value(None),
+        )
+
+        # First access warns and delegates to primary table
+        with reactive.isolate(), pytest.warns(FutureWarning, match="multiple tables"):
+            result = vals.sql()
+        assert result is None  # primary table has no SQL set
+
+        # Subsequent accesses on the same instance don't re-warn
+        with reactive.isolate(), warnings.catch_warnings():
+            warnings.simplefilter("error")
+            assert vals.sql.get() is None
+
+        # .set() delegates to the primary reactive
+        vals.sql.set("SELECT 1")
+        with reactive.isolate():
+            assert orders_sql.get() == "SELECT 1"
+
+        # title is a separate instance — first access warns independently
+        with reactive.isolate(), pytest.warns(FutureWarning, match="multiple tables"):
+            assert vals.title() is None
+
+    def test_shiny_server_values_tables_still_works(self, orders_df, customers_df):
+        from querychat._shiny_module import (
+            ServerValues,
+            TableState,
+            _MultiTableWarnReactive,
+        )
+
+        from shiny import reactive
+
+        orders_sql: reactive.Value[str | None] = reactive.Value(None)
+        orders_title: reactive.Value[str | None] = reactive.Value(None)
+        customers_sql: reactive.Value[str | None] = reactive.Value(None)
+        customers_title: reactive.Value[str | None] = reactive.Value(None)
+
+        table_list = "'orders', 'customers'"
+        vals = ServerValues(
+            df=lambda: None,  # type: ignore[return-value]
+            sql=_MultiTableWarnReactive(orders_sql, "sql", "orders", table_list),  # type: ignore[arg-type]
+            title=_MultiTableWarnReactive(orders_title, "title", "orders", table_list),  # type: ignore[arg-type]
+            tables={
+                "orders": TableState(sql=orders_sql, title=orders_title, df=lambda: orders_df),
+                "customers": TableState(sql=customers_sql, title=customers_title, df=lambda: customers_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={},
+            current_table=reactive.Value(None),
+        )
+
+        orders_state = vals._tables["orders"]
+        assert orders_state.df() is orders_df
+        customers_state = vals._tables["customers"]
+        assert customers_state.df() is customers_df
+
+    def test_server_values_table_names(self, orders_df, customers_df):
+        from querychat._querychat_base import normalize_data_source
+        from querychat._shiny_module import (
+            ServerValues,
+            TableState,
+            _MultiTableWarnReactive,
+        )
+
+        from shiny import reactive
+
+        orders_source = normalize_data_source(orders_df, "orders")
+        customers_source = normalize_data_source(customers_df, "customers")
+        table_list = "'orders', 'customers'"
+        vals = ServerValues(
+            df=lambda: None,  # type: ignore[return-value]
+            sql=_MultiTableWarnReactive(reactive.Value(None), "sql", "orders", table_list),  # type: ignore[arg-type]
+            title=_MultiTableWarnReactive(reactive.Value(None), "title", "orders", table_list),  # type: ignore[arg-type]
+            tables={
+                "orders": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: orders_df),
+                "customers": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: customers_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={"orders": orders_source, "customers": customers_source},
+            current_table=reactive.Value(None),
+        )
+
+        assert vals.table_names() == ["orders", "customers"]
+
+    def test_server_values_table_accessor_df(self, orders_df, customers_df):
+        from querychat._querychat_base import normalize_data_source
+        from querychat._shiny_module import ServerValues, TableState
+        from querychat._table_accessor import TableAccessor
+
+        from shiny import reactive
+
+        orders_source = normalize_data_source(orders_df, "orders")
+        customers_source = normalize_data_source(customers_df, "customers")
+        vals = ServerValues(
+            df=lambda: orders_df,  # type: ignore[return-value]
+            sql=reactive.Value(None),
+            title=reactive.Value(None),
+            tables={
+                "orders": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: orders_df),
+                "customers": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: customers_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={"orders": orders_source, "customers": customers_source},
+            current_table=reactive.Value(None),
+        )
+
+        accessor = vals.table("orders")
+        assert isinstance(accessor, TableAccessor)
+        assert accessor.table_name == "orders"
+        assert accessor.df() is orders_df
+
+        customers_accessor = vals.table("customers")
+        assert customers_accessor.df() is customers_df
+
+    def test_server_values_table_unknown_raises(self, orders_df):
+        from querychat._querychat_base import normalize_data_source
+        from querychat._shiny_module import ServerValues, TableState
+
+        from shiny import reactive
+
+        orders_source = normalize_data_source(orders_df, "orders")
+        vals = ServerValues(
+            df=lambda: orders_df,  # type: ignore[return-value]
+            sql=reactive.Value(None),
+            title=reactive.Value(None),
+            tables={
+                "orders": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: orders_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={"orders": orders_source},
+            current_table=reactive.Value(None),
+        )
+
+        with pytest.raises(ValueError, match="Table 'foo' not found"):
+            vals.table("foo")
+
+    def test_server_values_current_table_initially_none(self, orders_df):
+        from querychat._shiny_module import ServerValues, TableState
+
+        from shiny import reactive
+
+        vals = ServerValues(
+            df=lambda: orders_df,
+            sql=reactive.Value(None),
+            title=reactive.Value(None),
+            tables={
+                "orders": TableState(
+                    sql=reactive.Value(None),
+                    title=reactive.Value(None),
+                    df=lambda: orders_df,
+                ),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={},
+            current_table=reactive.Value(None),
+        )
+
+        with reactive.isolate():
+            assert vals.current_table() is None
+
+    def test_server_values_current_table_reflects_reactive(self, orders_df, customers_df):
+        from querychat._shiny_module import (
+            ServerValues,
+            TableState,
+            _MultiTableWarnReactive,
+        )
+
+        from shiny import reactive
+
+        ct_rv: reactive.Value[str | None] = reactive.Value(None)
+        table_list = "'orders', 'customers'"
+        vals = ServerValues(
+            df=lambda: None,  # type: ignore[return-value]
+            sql=_MultiTableWarnReactive(reactive.Value(None), "sql", "orders", table_list),  # type: ignore[arg-type]
+            title=_MultiTableWarnReactive(reactive.Value(None), "title", "orders", table_list),  # type: ignore[arg-type]
+            tables={
+                "orders": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: orders_df),
+                "customers": TableState(sql=reactive.Value(None), title=reactive.Value(None), df=lambda: customers_df),
+            },
+            client=None,  # type: ignore[arg-type]
+            data_sources={},
+            current_table=ct_rv,
+        )
+
+        with reactive.isolate():
+            assert vals.current_table() is None
+            ct_rv.set("orders")
+            assert vals.current_table() == "orders"
+            ct_rv.set("customers")
+            assert vals.current_table() == "customers"
+
+    def test_shiny_app_works_multi_table(self, orders_df, customers_df):
+        from querychat.shiny import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        app = qc.app()
+        assert app is not None
+
+    def test_shiny_app_works_single_table(self, orders_df):
+        from querychat.shiny import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        app = qc.app()
+        assert app is not None
+
+    def test_streamlit_app_raises_multi_table(self, orders_df, customers_df):
+        pytest.importorskip("streamlit")
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        with pytest.raises(RuntimeError, match="does not support multiple tables"):
+            qc.app()
+
+    def test_streamlit_df_raises_multi_table(self, orders_df, customers_df):
+        pytest.importorskip("streamlit")
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        with pytest.raises(AttributeError, match="multiple tables"):
+            qc.df()
+
+    def test_streamlit_sql_raises_multi_table(self, orders_df, customers_df):
+        pytest.importorskip("streamlit")
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        with pytest.raises(AttributeError, match="multiple tables"):
+            qc.sql()
+
+    def test_streamlit_title_raises_multi_table(self, orders_df, customers_df):
+        pytest.importorskip("streamlit")
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        with pytest.raises(AttributeError, match="multiple tables"):
+            qc.title()
+
+    def test_streamlit_single_table_accessor_still_works(self, orders_df, customers_df):
+        pytest.importorskip("streamlit")
+        from unittest.mock import patch
+
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")
+        with patch("streamlit.session_state", {}):
+            result = qc.table("customers").df()
+        assert result["id"].tolist() == [101, 102, 103]
+
+    def test_state_dict_mixin_df_warns_multi_table(self, orders_df, customers_df):
+        from unittest.mock import MagicMock
+
+        from querychat import QueryChat
+        from querychat._querychat_base import StateDictQueryChat
+
+        qc = QueryChat(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+        # Minimal StateDictQueryChat stub backed by qc's sources and a built executor.
+        class DummyAccessor(StateDictQueryChat):
+            def __init__(self):
+                self._data_sources = dict(qc._data_sources)
+                # Build explicitly: the cached attribute may be unset (executors are lazy).
+                self._query_executor = qc._require_query_executor("test")
+                self.greeting = None
+
+            def _require_initialized(self, _m):
+                pass
+
+            def _require_query_executor(self, _m):
+                return self._query_executor
+
+            def client(self, **_kw):
+                return MagicMock()
+        # Flat df() without table= must warn and return the primary table's rows.
+        acc = DummyAccessor()
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.df({"sql": None, "title": None, "error": None, "turns": []})
+        assert result["id"].tolist() == [1, 2, 3]  # primary table, no filter
+
+    def test_state_dict_mixin_sql_warns_multi_table(self, orders_df, customers_df):
+        from unittest.mock import MagicMock
+
+        from querychat import QueryChat
+        from querychat._querychat_base import StateDictQueryChat
+
+        qc = QueryChat(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+        # Minimal StateDictQueryChat stub backed by qc's sources and a built executor.
+        class DummyAccessor(StateDictQueryChat):
+            def __init__(self):
+                self._data_sources = dict(qc._data_sources)
+                # Build explicitly: the cached attribute may be unset (executors are lazy).
+                self._query_executor = qc._require_query_executor("test")
+                self.greeting = None
+
+            def _require_initialized(self, _m):
+                pass
+
+            def _require_query_executor(self, _m):
+                return self._query_executor
+
+            def client(self, **_kw):
+                return MagicMock()
+        # Flat sql() without table= must warn and return the primary table's SQL.
+        acc = DummyAccessor()
+        state = {
+            "sql": "SELECT 1",
+            "title": None,
+            "error": None,
+            "table": "orders",
+            "table_states": {"orders": {"sql": "SELECT 1", "title": None, "error": None}},
+            "turns": [],
+        }
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.sql(state)
+        assert result == "SELECT 1"
+
+    def test_state_dict_mixin_title_warns_multi_table(self, orders_df, customers_df):
+        from unittest.mock import MagicMock
+
+        from querychat import QueryChat
+        from querychat._querychat_base import StateDictQueryChat
+
+        qc = QueryChat(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+        # Minimal StateDictQueryChat stub backed by qc's sources and a built executor.
+        class DummyAccessor(StateDictQueryChat):
+            def __init__(self):
+                self._data_sources = dict(qc._data_sources)
+                # Build explicitly: the cached attribute may be unset (executors are lazy).
+                self._query_executor = qc._require_query_executor("test")
+                self.greeting = None
+
+            def _require_initialized(self, _m):
+                pass
+
+            def _require_query_executor(self, _m):
+                return self._query_executor
+
+            def client(self, **_kw):
+                return MagicMock()
+        # Flat title() without table= must warn and return the primary table's title.
+        acc = DummyAccessor()
+        state = {
+            "sql": None,
+            "title": None,
+            "error": None,
+            "table": "orders",
+            "table_states": {"orders": {"sql": None, "title": "Big orders", "error": None}},
+            "turns": [],
+        }
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.title(state)
+        assert result == "Big orders"
+
+    def test_state_dict_mixin_with_table_kwarg_still_works(self, orders_df, customers_df):
+        from unittest.mock import MagicMock
+
+        from querychat import QueryChat
+        from querychat._querychat_base import StateDictQueryChat
+
+        qc = QueryChat(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+        # Minimal StateDictQueryChat stub backed by qc's sources and a built executor.
+        class DummyAccessor(StateDictQueryChat):
+            def __init__(self):
+                self._data_sources = dict(qc._data_sources)
+                # Build explicitly: the cached attribute may be unset (executors are lazy).
+                self._query_executor = qc._require_query_executor("test")
+                self.greeting = None
+
+            def _require_initialized(self, _m):
+                pass
+
+            def _require_query_executor(self, _m):
+                return self._query_executor
+
+            def client(self, **_kw):
+                return MagicMock()
+        # With an explicit table=, sql()/title() read that table's (empty) state.
+        acc = DummyAccessor()
+        state = {
+            "table_states": {
+                "orders": {"sql": None, "title": None, "error": None},
+                "customers": {"sql": None, "title": None, "error": None},
+            },
+            "sql": None, "title": None, "error": None, "turns": [],
+        }
+        assert acc.sql(state, table="orders") is None
+        assert acc.title(state, table="orders") is None
+
+
+class TestMultiTableQueryTool:
+    def test_client_query_tool_executes_join_against_shared_executor(
+        self, orders_df, customers_df
+    ):
+        qc = QueryChat(orders_df, "orders", greeting="Hello!")
+        qc.add_table(customers_df, "customers")
+        registered_tools = []
+        # Record every tool handed to Chat.register_tool so it can be called directly.
+        def capture_registered_tool(_chat, tool):
+            registered_tools.append(tool)
+
+        with patch(
+            "chatlas.Chat.register_tool",
+            autospec=True,  # keeps the method signature, so the Chat instance arrives as _chat
+            side_effect=capture_registered_tool,
+        ):
+            qc.client(tools="query")
+        # Invoke the captured query tool with a join that spans both tables.
+        query_tool = next(tool for tool in registered_tools if tool.name == "querychat_query")
+        result = query_tool.func(
+            """
+            SELECT customers.name, orders.amount
+            FROM orders
+            JOIN customers ON orders.customer_id = customers.id
+            WHERE orders.id = 1
+            """
+        )
+
+        assert result.error is None
+        assert result.value == [{"name": "Alice", "amount": 100.0}]
+
+
+class TestDataDictListInput:
+    """Tests for list-based data_dict input to QueryChat."""
+
+    def test_accepts_list_of_data_dicts(self, orders_df, customers_df) -> None:
+        from querychat._data_dict import DataDict, TableSpec
+
+        dd1 = DataDict(name="sales", tables={"orders": TableSpec(description="Orders")})
+        dd2 = DataDict(
+            name="people", tables={"customers": TableSpec(description="Customers")}
+        )
+        qc = QueryChat(orders_df, "orders", data_dict=[dd1, dd2])  # list of DataDict objects
+        qc.add_table(customers_df, "customers")
+        assert qc is not None  # NOTE(review): always true; the real check is that nothing above raised
+
+    def test_accepts_list_of_paths(self, orders_df, customers_df, tmp_path) -> None:
+        f1 = tmp_path / "orders_dict.yaml"
+        f2 = tmp_path / "customers_dict.yaml"
+        f1.write_text('tables:\n  orders:\n    description: "Order records."\n')
+        f2.write_text('tables:\n  customers:\n    description: "Customer records."\n')
+        qc = QueryChat(orders_df, "orders", data_dict=[f1, f2])  # list of YAML file paths
+        qc.add_table(customers_df, "customers")
+        assert qc is not None  # NOTE(review): always true; the real check is that nothing above raised
+
+    def test_single_data_dict_still_works(self, orders_df) -> None:
+        from querychat._data_dict import DataDict, TableSpec
+
+        dd = DataDict(name="sales", tables={"orders": TableSpec(description="Orders")})
+        qc = QueryChat(orders_df, "orders", data_dict=dd)  # single DataDict, not wrapped in a list
+        assert qc is not None  # NOTE(review): always true; the real check is that nothing above raised
+
+    def test_list_dicts_appear_in_system_prompt(
+        self, orders_df, customers_df
+    ) -> None:
+        from querychat._data_dict import DataDict, TableSpec
+
+        dd1 = DataDict(name="sales", tables={"orders": TableSpec(description="Orders")})
+        dd2 = DataDict(
+            name="people", tables={"customers": TableSpec(description="Customers")}
+        )
+        qc = QueryChat(orders_df, "orders", data_dict=[dd1, dd2])
+        qc.add_table(customers_df, "customers")
+        qc._build_system_prompt()
+        rendered = qc._system_prompt.render(qc.tools)
+        assert 'name="sales"' in rendered  # first dictionary's name is in the rendered prompt
+        assert 'name="people"' in rendered  # second dictionary's name is in the rendered prompt
diff --git a/pkg-py/tests/test_multi_table_frameworks.py b/pkg-py/tests/test_multi_table_frameworks.py
new file mode 100644
index 000000000..d60b8336f
--- /dev/null
+++ b/pkg-py/tests/test_multi_table_frameworks.py
@@ -0,0 +1,229 @@
+"""Tests for per-table accessor API in non-Shiny frameworks."""
+
+import os
+from unittest.mock import MagicMock
+
+import pandas as pd
+import pytest
+
+
+@pytest.fixture(autouse=True)
+def set_dummy_api_key():
+    """Give every test a dummy OPENAI_API_KEY, then restore the previous environment."""
+    old = os.environ.get("OPENAI_API_KEY")
+    os.environ["OPENAI_API_KEY"] = "sk-dummy-api-key-for-testing"
+    yield
+    os.environ.pop("OPENAI_API_KEY", None)  # pop, not del: a test may have removed it already
+    if old is not None:
+        os.environ["OPENAI_API_KEY"] = old
+
+
+@pytest.fixture
+def orders_df():
+    return pd.DataFrame({"id": [1, 2, 3], "amount": [100.0, 200.0, 150.0]})
+
+
+@pytest.fixture
+def customers_df():
+    return pd.DataFrame({"id": [101, 102], "name": ["Alice", "Bob"], "state": ["CA", "NY"]})
+
+
+class TestStreamlitMultiTable:  # per-table accessors on the Streamlit QueryChat
+    @pytest.fixture(autouse=True)
+    def _skip(self):
+        pytest.importorskip("streamlit")  # skip this class's tests when streamlit is not installed
+
+    def _make_qc(self, orders_df, customers_df):
+        from querychat.streamlit import QueryChat
+
+        qc = QueryChat(orders_df, "orders", greeting="Hi")
+        qc.add_table(customers_df, "customers")  # second table, so qc holds two tables
+        return qc
+
+    def test_table_returns_streamlit_table_accessor(self, orders_df, customers_df):
+        from querychat.streamlit import StreamlitTableAccessor
+
+        qc = self._make_qc(orders_df, customers_df)
+        acc = qc.table("orders")
+        assert isinstance(acc, StreamlitTableAccessor)
+
+    def test_table_unknown_raises(self, orders_df, customers_df):
+        qc = self._make_qc(orders_df, customers_df)
+        with pytest.raises(ValueError, match="'foo' not found"):
+            qc.table("foo")  # "foo" was never added
+
+    def test_table_df_returns_full_data_when_no_filter(self, orders_df, customers_df):
+        from unittest.mock import patch
+
+        qc = self._make_qc(orders_df, customers_df)
+        fake_session = {}  # stand-in for streamlit.session_state
+        with patch("streamlit.session_state", fake_session):
+            result = qc.table("customers").df()
+        assert result["id"].tolist() == [101, 102]  # both fixture rows, nothing filtered
+
+    def test_table_df_applies_filter(self, orders_df, customers_df):
+        from unittest.mock import patch
+
+        qc = self._make_qc(orders_df, customers_df)
+        fake_session = {}  # stand-in for streamlit.session_state
+        with patch("streamlit.session_state", fake_session):
+            # Simulate the LLM having set a filter for customers
+            state = qc._get_state()  # initialises session state
+            state._table_states["customers"]["sql"] = (
+                "SELECT * FROM customers WHERE state = 'CA'"
+            )
+            result = qc.table("customers").df()
+        assert result["id"].tolist() == [101]  # only the fixture row with state 'CA'
+
+    def test_table_sql_and_title(self, orders_df, customers_df):
+        from unittest.mock import patch
+
+        qc = self._make_qc(orders_df, customers_df)
+        fake_session = {}  # stand-in for streamlit.session_state
+        with patch("streamlit.session_state", fake_session):
+            state = qc._get_state()
+            state._table_states["orders"]["sql"] = "SELECT * FROM orders WHERE amount > 100"
+            state._table_states["orders"]["title"] = "Big orders"
+            assert qc.table("orders").sql() == "SELECT * FROM orders WHERE amount > 100"
+            assert qc.table("orders").title() == "Big orders"
+            assert qc.table("customers").sql() is None  # customers state was not touched
+
+
+class TestStateDictQueryChatMultiTable:
+    """Tests for table= parameter on StateDictQueryChat."""
+
+    def _make_accessor(self, orders_df, customers_df):
+        from querychat import QueryChat
+        from querychat._querychat_base import StateDictQueryChat
+
+        qc = QueryChat(orders_df, "orders")
+        qc.add_table(customers_df, "customers")
+
+        class DummyAccessor(StateDictQueryChat):
+            def __init__(self):
+                self._data_sources = dict(qc._data_sources)
+                self._query_executor = qc._require_query_executor("test")
+                self.greeting = None
+
+            def _require_initialized(self, _m):
+                pass
+
+            def _require_query_executor(self, _m):
+                return self._query_executor
+
+            def client(self, **_kw):
+                return MagicMock()
+
+        return DummyAccessor()
+
+    def _state(self, active="orders", orders_sql=None, customers_sql=None):
+        """Build a state dict with table_states."""
+        return {
+            "table": active,
+            "sql": orders_sql if active == "orders" else customers_sql,
+            "title": None,
+            "error": None,
+            "table_states": {
+                "orders": {"sql": orders_sql, "title": None, "error": None},
+                "customers": {"sql": customers_sql, "title": None, "error": None},
+            },
+            "turns": [],
+        }
+
+    def test_df_table_kwarg_returns_specific_table_data(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = self._state(
+            active="orders",
+            orders_sql="SELECT * FROM orders WHERE amount > 100",
+            customers_sql=None,
+        )
+        result = acc.df(state, table="customers")
+        # customers has no filter → full dataset
+        assert result["id"].tolist() == [101, 102]
+
+    def test_df_table_kwarg_applies_filter(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = self._state(
+            active="orders",
+            customers_sql="SELECT * FROM customers WHERE state = 'CA'",
+        )
+        result = acc.df(state, table="customers")
+        assert result["id"].tolist() == [101]
+
+    def test_sql_table_kwarg(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = self._state(customers_sql="SELECT * FROM customers WHERE state = 'NY'")
+        assert acc.sql(state, table="customers") == (
+            "SELECT * FROM customers WHERE state = 'NY'"
+        )
+        assert acc.sql(state, table="orders") is None
+
+    def test_title_table_kwarg(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = {
+            "table": "customers",
+            "sql": None,
+            "title": None,
+            "error": None,
+            "table_states": {
+                "orders": {"sql": None, "title": "Big orders", "error": None},
+                "customers": {"sql": None, "title": None, "error": None},
+            },
+            "turns": [],
+        }
+        assert acc.title(state, table="orders") == "Big orders"
+        assert acc.title(state, table="customers") is None
+
+    def test_backward_compat_no_table_states_key(self, orders_df, customers_df):
+        """Old state dicts without table_states should still work for the active table."""
+        acc = self._make_accessor(orders_df, customers_df)
+        old_state = {
+            "table": "orders",
+            "sql": "SELECT * FROM orders WHERE amount > 100",
+            "title": "Big orders",
+            "error": None,
+            "turns": [],
+        }
+        assert acc.sql(old_state, table="orders") == (
+            "SELECT * FROM orders WHERE amount > 100"
+        )
+        assert acc.title(old_state, table="orders") == "Big orders"
+        # Non-active table with no table_states → None
+        assert acc.sql(old_state, table="customers") is None
+
+    def test_df_no_table_warns_and_returns_primary(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = self._state(active="orders")
+
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.df(state)
+        # No filter on primary table → full orders dataset
+        assert result["id"].tolist() == [1, 2, 3]
+
+    def test_sql_no_table_warns_and_returns_primary(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = self._state(orders_sql="SELECT * FROM orders WHERE amount > 100")
+
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.sql(state)
+        assert result == "SELECT * FROM orders WHERE amount > 100"
+
+    def test_title_no_table_warns_and_returns_primary(self, orders_df, customers_df):
+        acc = self._make_accessor(orders_df, customers_df)
+        state = {
+            "table": "orders",
+            "sql": None,
+            "title": None,
+            "error": None,
+            "table_states": {
+                "orders": {"sql": None, "title": "Big orders", "error": None},
+                "customers": {"sql": None, "title": None, "error": None},
+            },
+            "turns": [],
+        }
+
+        with pytest.warns(FutureWarning, match="multiple tables"):
+            result = acc.title(state)
+        assert result == "Big orders"
+
+
diff --git a/pkg-py/tests/test_pin_source.py b/pkg-py/tests/test_pin_source.py
index de52db338..fb39480fd 100644
--- a/pkg-py/tests/test_pin_source.py
+++ b/pkg-py/tests/test_pin_source.py
@@ -259,7 +259,7 @@ def test_explicit_description_survives_source_change(self, board, sample_df):
             data_description="Custom description",
         )
         try:
-            qc.data_source = sample_df
+            qc.add_table(sample_df, "cars", replace=True)
             prompt = qc._system_prompt.render(qc.tools)
             assert "Custom description" in prompt
             assert "Motor Trend Cars" not in prompt
@@ -278,7 +278,7 @@ def test_clears_auto_description_on_source_change(self, board, sample_df):
             prompt_before = qc._system_prompt.render(qc.tools)
             assert "Motor Trend Cars" in prompt_before
 
-            qc.data_source = sample_df
+            qc.add_table(sample_df, "cars", replace=True)
             prompt_after = qc._system_prompt.render(qc.tools)
             assert "Motor Trend Cars" not in prompt_after
         finally:
diff --git a/pkg-py/tests/test_query_executor.py b/pkg-py/tests/test_query_executor.py
new file mode 100644
index 000000000..aa38c549f
--- /dev/null
+++ b/pkg-py/tests/test_query_executor.py
@@ -0,0 +1,433 @@
+from __future__ import annotations
+
+import tempfile
+from pathlib import Path
+
+import narwhals.stable.v1 as nw
+import pandas as pd
+import polars as pl
+import pytest
+from querychat._datasource import (
+    DataFrameSource,
+    IbisSource,
+    MissingColumnsError,
+    PolarsLazySource,
+    SQLAlchemySource,
+)
+from querychat._query_executor import (
+    DataSourceExecutor,
+    DuckDBExecutor,
+    PolarsSQLExecutor,
+)
+from sqlalchemy import create_engine, text
+
+
+@pytest.fixture
+def orders_source():
+    """Pandas-backed ``orders`` source: three orders placed by two customers."""
+    order_ids, customer_ids = [1, 2, 3], [10, 20, 10]
+    amounts = [100.0, 200.0, 150.0]
+    columns = {"order_id": order_ids, "customer_id": customer_ids, "amount": amounts}
+    frame = pd.DataFrame(columns)
+    return DataFrameSource(nw.from_native(frame), "orders")
+
+
+@pytest.fixture
+def customers_source():
+    """Pandas-backed ``customers`` source holding three id/name rows."""
+    ids = [10, 20, 30]
+    names = ["Alice", "Bob", "Charlie"]
+    frame = pd.DataFrame({"id": ids, "name": names})
+    return DataFrameSource(nw.from_native(frame), "customers")
+
+
+@pytest.fixture
+def sqlite_sources(tmp_path):
+    """Yield ``orders``/``customers`` SQLAlchemySources sharing one SQLite engine."""
+    # The database file lives under pytest's per-test ``tmp_path``, so its
+    # removal is handled by pytest even when table setup raises before the yield.
+    engine = create_engine(f"sqlite:///{tmp_path / 'sources.db'}")
+
+    with engine.begin() as conn:
+        conn.execute(text("""
+            CREATE TABLE orders (
+                order_id INTEGER,
+                customer_id INTEGER,
+                amount REAL
+            )
+        """))
+        conn.execute(text("""
+            CREATE TABLE customers (
+                id INTEGER,
+                name TEXT
+            )
+        """))
+        conn.execute(
+            text("""
+                INSERT INTO orders (order_id, customer_id, amount)
+                VALUES
+                    (1, 10, 100.0),
+                    (2, 20, 200.0),
+                    (3, 10, 150.0)
+            """)
+        )
+        conn.execute(
+            text("""
+                INSERT INTO customers (id, name)
+                VALUES
+                    (10, 'Alice'),
+                    (20, 'Bob'),
+                    (30, 'Charlie')
+            """)
+        )
+
+    yield {
+        "orders": SQLAlchemySource(engine, "orders"),
+        "customers": SQLAlchemySource(engine, "customers"),
+    }
+
+    engine.dispose()
+
+
+@pytest.fixture
+def ibis_sources():
+    """Yield ``orders``/``customers`` IbisSources built on one DuckDB connection.
+
+    Skipped when ibis cannot be imported; the connection is disconnected after
+    the yield.
+    """
+    ibis = pytest.importorskip("ibis")
+    backend = ibis.duckdb.connect()
+    seed_data = {
+        "orders": {
+            "order_id": [1, 2, 3],
+            "customer_id": [10, 20, 10],
+            "amount": [100.0, 200.0, 150.0],
+        },
+        "customers": {"id": [10, 20, 30], "name": ["Alice", "Bob", "Charlie"]},
+    }
+    for table_name, columns in seed_data.items():
+        backend.create_table(table_name, columns)
+
+    yield {
+        name: IbisSource(backend.table(name), name)
+        for name in ("orders", "customers")
+    }
+
+    backend.disconnect()
+
+
+@pytest.fixture
+def orders_polars_dataframe_source():
+    """Eager polars DataFrame of three orders, registered as ``orders_polars``."""
+    order_ids, customer_ids = [1, 2, 3], [10, 20, 10]
+    amounts = [100.0, 200.0, 150.0]
+    columns = {"order_id": order_ids, "customer_id": customer_ids, "amount": amounts}
+    frame = pl.DataFrame(columns)
+    return DataFrameSource(nw.from_native(frame), "orders_polars")
+
+
+class TestDuckDBExecutor:
+    @pytest.fixture
+    def make_executor(self):
+        """Factory for DuckDBExecutors that are cleaned up even if the test fails."""
+        created = []
+
+        def _make(sources):
+            created.append(DuckDBExecutor(sources))
+            return created[-1]
+
+        yield _make
+        for executor in created:
+            executor.cleanup()
+
+    def test_cross_table_join(self, make_executor, orders_source, customers_source):
+        executor = make_executor({"orders": orders_source, "customers": customers_source})
+        result = executor.execute_query(
+            "SELECT o.order_id, c.name "
+            "FROM orders o JOIN customers c ON o.customer_id = c.id"
+        )
+        nw_df = nw.from_native(result, eager_only=True)
+        assert set(nw_df.columns) == {"order_id", "name"}
+        assert nw_df.shape[0] == 3
+
+    def test_single_table_query(self, make_executor, orders_source, customers_source):
+        executor = make_executor({"orders": orders_source, "customers": customers_source})
+        result = executor.execute_query("SELECT * FROM orders WHERE amount > 100")
+        nw_df = nw.from_native(result, eager_only=True)
+        assert nw_df.shape[0] == 2
+
+    def test_returns_native_type(self, make_executor, orders_source):
+        executor = make_executor({"orders": orders_source})
+        result = executor.execute_query("SELECT * FROM orders")
+        assert isinstance(result, pd.DataFrame)
+
+    def test_get_db_type(self, make_executor, orders_source):
+        executor = make_executor({"orders": orders_source})
+        assert executor.get_db_type() == "DuckDB"
+
+    def test_test_query_passes(self, make_executor, orders_source):
+        executor = make_executor({"orders": orders_source})
+        executor.test_query(
+            "SELECT * FROM orders",
+            table_name="orders",
+            require_all_columns=True,
+        )
+
+    def test_test_query_missing_columns(self, make_executor, orders_source):
+        executor = make_executor({"orders": orders_source})
+        with pytest.raises(MissingColumnsError, match="missing required columns"):
+            executor.test_query(
+                "SELECT order_id FROM orders",
+                table_name="orders",
+                require_all_columns=True,
+            )
+
+    def test_test_query_cross_table_join(
+        self, make_executor, orders_source, customers_source
+    ):
+        executor = make_executor({"orders": orders_source, "customers": customers_source})
+        executor.test_query(
+            "SELECT o.* FROM orders o "
+            "JOIN customers c ON o.customer_id = c.id "
+            "WHERE c.name = 'Alice'",
+            table_name="orders",
+            require_all_columns=True,
+        )
+
+    def test_unsafe_query_rejected(self, make_executor, orders_source):
+        executor = make_executor({"orders": orders_source})
+        with pytest.raises(Exception, match=r"(?i)disallowed|unsafe|not allowed"):
+            executor.execute_query("DROP TABLE orders")
+
+    def test_cleanup_closes_connection(self, orders_source):
+        import duckdb
+
+        # Built directly rather than through make_executor: this test performs
+        # the cleanup itself and then checks the executor is no longer usable.
+        executor = DuckDBExecutor({"orders": orders_source})
+        executor.cleanup()
+        with pytest.raises(duckdb.ConnectionException):
+            executor.execute_query("SELECT 1")
+
+    def test_rejects_mixed_dataframe_backends(
+        self, orders_source, orders_polars_dataframe_source
+    ):
+        with pytest.raises(ValueError, match="same DataFrame backend"):
+            DuckDBExecutor({
+                "orders": orders_source,
+                "orders_polars": orders_polars_dataframe_source,
+            })
+
+    def test_rejects_mixed_dataframe_backends_before_opening_connection(
+        self, monkeypatch, orders_source, orders_polars_dataframe_source
+    ):
+        def fail_if_connect_called(*args, **kwargs):
+            raise AssertionError("duckdb.connect should not be called")
+
+        monkeypatch.setattr("querychat._query_executor.duckdb.connect", fail_if_connect_called)
+
+        with pytest.raises(ValueError, match="same DataFrame backend"):
+            DuckDBExecutor({
+                "orders": orders_source,
+                "orders_polars": orders_polars_dataframe_source,
+            })
+
+
+@pytest.fixture
+def orders_polars_source():
+    """Lazy polars ``orders`` source: three orders placed by two customers."""
+    order_ids, customer_ids = [1, 2, 3], [10, 20, 10]
+    amounts = [100.0, 200.0, 150.0]
+    columns = {"order_id": order_ids, "customer_id": customer_ids, "amount": amounts}
+    lazy_orders = pl.LazyFrame(columns)
+    return PolarsLazySource(nw.from_native(lazy_orders), "orders")
+
+
+@pytest.fixture
+def customers_polars_source():
+    """Lazy polars ``customers`` source holding three id/name rows."""
+    ids = [10, 20, 30]
+    names = ["Alice", "Bob", "Charlie"]
+    lazy_customers = pl.LazyFrame({"id": ids, "name": names})
+    return PolarsLazySource(nw.from_native(lazy_customers), "customers")
+
+
+class TestPolarsSQLExecutor:
+    """PolarsSQLExecutor behaviour over lazy polars sources."""
+
+    def test_cross_table_join(self, orders_polars_source, customers_polars_source):
+        sources = {"orders": orders_polars_source, "customers": customers_polars_source}
+        executor = PolarsSQLExecutor(sources)
+        lazy_result = executor.execute_query(
+            "SELECT o.order_id, c.name "
+            "FROM orders o JOIN customers c ON o.customer_id = c.id"
+        )
+        assert isinstance(lazy_result, pl.LazyFrame)
+        materialized = lazy_result.collect()
+        assert set(materialized.columns) == {"order_id", "name"}
+        assert materialized.shape[0] == 3
+
+    def test_get_db_type(self, orders_polars_source):
+        db_type = PolarsSQLExecutor({"orders": orders_polars_source}).get_db_type()
+        assert db_type == "Polars"
+
+    def test_test_query_missing_columns(self, orders_polars_source):
+        narrow_sql = "SELECT order_id FROM orders"
+        executor = PolarsSQLExecutor({"orders": orders_polars_source})
+        with pytest.raises(MissingColumnsError, match="missing required columns"):
+            executor.test_query(
+                narrow_sql, table_name="orders", require_all_columns=True
+            )
+
+    def test_cleanup_noop(self, orders_polars_source):
+        # Only checks that cleanup() can be called without raising.
+        executor = PolarsSQLExecutor({"orders": orders_polars_source})
+        executor.cleanup()
+
+
+class TestDataSourceExecutor:
+    """DataSourceExecutor behaviour for single and shared-backend sources."""
+
+    def test_single_table_execute(self, orders_source):
+        executor = DataSourceExecutor({"orders": orders_source})
+        raw_rows = executor.execute_query("SELECT * FROM orders")
+        all_rows = nw.from_native(raw_rows, eager_only=True)
+        assert all_rows.shape[0] == 3
+
+    def test_get_db_type(self, orders_source):
+        db_type = DataSourceExecutor({"orders": orders_source}).get_db_type()
+        assert db_type == "DuckDB"
+
+    def test_test_query_routes_by_table(self, orders_source, customers_source):
+        sources = {"orders": orders_source, "customers": customers_source}
+        executor = DataSourceExecutor(sources)
+        # Validation targets ``orders``, so its columns are the required set.
+        with pytest.raises(MissingColumnsError, match="missing required columns"):
+            executor.test_query(
+                "SELECT order_id FROM orders",
+                table_name="orders",
+                require_all_columns=True,
+            )
+
+    def test_shared_sqlalchemy_sources_support_cross_table_query(self, sqlite_sources):
+        join_sql = (
+            "SELECT o.order_id, c.name "
+            "FROM orders o JOIN customers c ON o.customer_id = c.id"
+        )
+        executor = DataSourceExecutor(sqlite_sources)
+        joined = nw.from_native(executor.execute_query(join_sql), eager_only=True)
+        assert set(joined.columns) == {"order_id", "name"}
+        assert joined.shape[0] == 3
+
+    def test_rejects_sqlalchemy_sources_with_different_engines(self):
+        # Each table lives in its own SQLite file, i.e. behind its own Engine.
+        orders_file = tempfile.NamedTemporaryFile(delete=False, suffix=".db")  # noqa: SIM115
+        customers_file = tempfile.NamedTemporaryFile(delete=False, suffix=".db")  # noqa: SIM115
+        orders_file.close()
+        customers_file.close()
+        orders_engine = create_engine(f"sqlite:///{orders_file.name}")
+        customers_engine = create_engine(f"sqlite:///{customers_file.name}")
+
+        try:
+            with orders_engine.begin() as orders_conn:
+                orders_conn.execute(
+                    text("""
+                        CREATE TABLE orders (
+                            order_id INTEGER,
+                            customer_id INTEGER
+                        )
+                    """)
+                )
+            with customers_engine.begin() as customers_conn:
+                customers_conn.execute(
+                    text("""
+                        CREATE TABLE customers (
+                            id INTEGER,
+                            name TEXT
+                        )
+                    """)
+                )
+
+            with pytest.raises(ValueError, match="share the same Engine instance"):
+                DataSourceExecutor({
+                    "orders": SQLAlchemySource(orders_engine, "orders"),
+                    "customers": SQLAlchemySource(customers_engine, "customers"),
+                })
+        finally:
+            for engine in (orders_engine, customers_engine):
+                engine.dispose()
+            for db_file in (orders_file, customers_file):
+                Path(db_file.name).unlink()
+
+    def test_shared_ibis_sources_support_cross_table_query(self, ibis_sources):
+        join_sql = (
+            "SELECT o.order_id, c.name "
+            "FROM orders o JOIN customers c ON o.customer_id = c.id"
+        )
+        executor = DataSourceExecutor(ibis_sources)
+        joined = executor.execute_query(join_sql).execute()
+        assert set(joined.columns) == {"order_id", "name"}
+        assert joined.shape[0] == 3
+
+    def test_rejects_ibis_sources_with_different_backends(self):
+        ibis = pytest.importorskip("ibis")
+        # Two independent DuckDB connections, one table in each.
+        orders_db = ibis.duckdb.connect()
+        customers_db = ibis.duckdb.connect()
+        try:
+            orders_db.create_table("orders", {"order_id": [1], "customer_id": [10]})
+            customers_db.create_table("customers", {"id": [10], "name": ["Alice"]})
+
+            with pytest.raises(ValueError, match="share the same backend instance"):
+                DataSourceExecutor({
+                    "orders": IbisSource(orders_db.table("orders"), "orders"),
+                    "customers": IbisSource(customers_db.table("customers"), "customers"),
+                })
+        finally:
+            orders_db.disconnect()
+            customers_db.disconnect()
+
+    def test_cleanup_noop(self, orders_source):
+        # Only checks that cleanup() can be called without raising.
+        DataSourceExecutor({"orders": orders_source}).cleanup()
+
+
+def test_datasource_executor_get_column_metas() -> None:
+    """Column metas come back in frame order with no min value populated."""
+    frame = pl.DataFrame({"id": [1, 2], "name": ["a", "b"]})
+    executor = DataSourceExecutor({"t": DataFrameSource(nw.from_native(frame), "t")})
+    column_metas = executor.get_column_metas("t")
+    assert [meta.name for meta in column_metas] == ["id", "name"]
+    assert all(meta.min_val is None for meta in column_metas)
+
+
+def test_datasource_executor_get_schema() -> None:
+    """The schema text names the table and mentions both of its columns."""
+    frame = pl.DataFrame({"id": [1, 2, 3], "val": [10.0, 20.0, 30.0]})
+    executor = DataSourceExecutor({"t": DataFrameSource(nw.from_native(frame), "t")})
+    schema_text = executor.get_schema("t", categorical_threshold=10)
+    assert "Table: t" in schema_text
+    for expected_column in ("id", "val"):
+        assert expected_column in schema_text
+
+
+def test_duckdb_executor_get_column_metas() -> None:
+    first = pl.DataFrame({"id": [1, 2], "val": [10.0, 20.0]})
+    second = pl.DataFrame({"id": [1, 2], "name": ["a", "b"]})
+    sources = {"t1": DataFrameSource(nw.from_native(first), "t1")}
+    sources["t2"] = DataFrameSource(nw.from_native(second), "t2")
+    executor = DuckDBExecutor(sources)
+    # Two tables are registered; only t1's columns should be reported.
+    assert [meta.name for meta in executor.get_column_metas("t1")] == ["id", "val"]
+
+
+def test_duckdb_executor_get_schema() -> None:
+    """Schema text for ``t1`` names the table and includes a ``Range:`` entry."""
+    first = pl.DataFrame({"id": [1, 2, 3], "val": [10.0, 20.0, 30.0]})
+    second = pl.DataFrame({"id": [1], "name": ["x"]})
+    sources = {"t1": DataFrameSource(nw.from_native(first), "t1")}
+    sources["t2"] = DataFrameSource(nw.from_native(second), "t2")
+    executor = DuckDBExecutor(sources)
+    schema_text = executor.get_schema("t1", categorical_threshold=10)
+    assert "Table: t1" in schema_text and "Range:" in schema_text
diff --git a/pkg-py/tests/test_querychat.py b/pkg-py/tests/test_querychat.py
index 7d8b94258..3293e3560 100644
--- a/pkg-py/tests/test_querychat.py
+++ b/pkg-py/tests/test_querychat.py
@@ -1,6 +1,7 @@
 import os
 from unittest.mock import patch
 
+import ibis
 import pandas as pd
 import polars as pl
 import pytest
@@ -45,7 +46,7 @@ def test_querychat_init(sample_df):
     assert qc.id == "querychat_test_table"
 
     # Even without server initialization, we should be able to query the data source
-    result = qc.data_source.execute_query(
+    result = qc._data_sources["test_table"].execute_query(
         "SELECT * FROM test_table WHERE id = 2",
     )
 
@@ -87,6 +88,10 @@ def test_querychat_client_has_system_prompt(sample_df):
     # The system_prompt should contain the table name since it includes schema info
     assert "test_table" in client.system_prompt
 
+    # The system_prompt property should also return the prompt with table info
+    assert qc.system_prompt is not None
+    assert "test_table" in qc.system_prompt
+
 
 def test_generate_greeting_uses_querychat_system_prompt(sample_df):
     """generate_greeting() should use the dataset-aware querychat system prompt."""
@@ -144,10 +149,10 @@ def test_querychat_with_polars_lazyframe():
     )
 
     # Should have created a PolarsLazySource
-    assert isinstance(qc.data_source, PolarsLazySource)
+    assert isinstance(qc._data_sources["test_table"], PolarsLazySource)
 
     # Query should return a native polars LazyFrame
-    result = qc.data_source.execute_query("SELECT * FROM test_table WHERE id = 2")
+    result = qc._data_sources["test_table"].execute_query("SELECT * FROM test_table WHERE id = 2")
     assert isinstance(result, pl.LazyFrame)
 
     # Collect to verify
@@ -158,8 +163,6 @@ def test_querychat_with_polars_lazyframe():
 
 def test_querychat_with_ibis_table():
     """Test that QueryChat accepts an Ibis Table."""
-    ibis = pytest.importorskip("ibis")
-
     conn = ibis.duckdb.connect()
     try:
         conn.create_table(
@@ -179,10 +182,10 @@ def test_querychat_with_ibis_table():
         )
 
         # Should have created an IbisSource
-        assert isinstance(qc.data_source, IbisSource)
+        assert isinstance(qc._data_sources["test_table"], IbisSource)
 
         # Query should return an ibis.Table
-        result = qc.data_source.execute_query("SELECT * FROM test_table WHERE id = 2")
+        result = qc._data_sources["test_table"].execute_query("SELECT * FROM test_table WHERE id = 2")
         assert isinstance(result, ibis.Table)
 
         # Execute to verify results
diff --git a/pkg-py/tests/test_state.py b/pkg-py/tests/test_state.py
index 44bca227b..d9fcfef22 100644
--- a/pkg-py/tests/test_state.py
+++ b/pkg-py/tests/test_state.py
@@ -7,7 +7,9 @@
 import narwhals.stable.v1 as nw
 import pandas as pd
 import pytest
+from querychat import QueryChat
 from querychat._datasource import DataFrameSource
+from querychat._querychat_base import StateDictQueryChat
 from querychat._querychat_core import (
     AppState,
     create_app_state,
@@ -50,43 +52,50 @@ def mock_client():
 
 class TestAppState:
     def test_initial_state(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
-        assert state.data_source is data_source
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
+        assert state.data_sources["test_table"] is data_source
         assert state.client is mock_client
         assert state.greeting is None
+        assert state.active_table == "test_table"
         assert state.sql is None
         assert state.title is None
 
     def test_with_greeting(self, data_source, mock_client):
         state = AppState(
-            data_source=data_source, client=mock_client, greeting="Welcome!"
+            data_sources={"test_table": data_source}, client=mock_client, greeting="Welcome!"
         )
         assert state.greeting == "Welcome!"
 
     def test_update_dashboard(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.update_dashboard(
-            {"query": "SELECT * FROM test_table", "title": "All Data"}
+            {
+                "table": "test_table",
+                "query": "SELECT * FROM test_table",
+                "title": "All Data",
+            }
         )
+        assert state.active_table == "test_table"
         assert state.sql == "SELECT * FROM test_table"
         assert state.title == "All Data"
 
     def test_reset_dashboard(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.sql = "SELECT * FROM test_table"
         state.title = "Test"
         state.reset_dashboard()
+        assert state.active_table == "test_table"
         assert state.sql is None
         assert state.title is None
 
     def test_get_current_data_without_sql(self, data_source, mock_client, sample_df):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         result = state.get_current_data()
         # Result is now native pandas DataFrame
         pd.testing.assert_frame_equal(result, sample_df.to_pandas())
 
     def test_get_current_data_with_valid_sql(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.sql = "SELECT * FROM test_table WHERE age > 25"
         result = state.get_current_data()
         assert len(result) == 2
@@ -96,7 +105,7 @@ def test_get_current_data_with_valid_sql(self, data_source, mock_client):
     def test_get_current_data_with_invalid_sql_resets(
         self, data_source, mock_client, sample_df
     ):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.sql = "INVALID SQL QUERY"
         state.title = "Will be cleared"
         result = state.get_current_data()
@@ -108,34 +117,219 @@ def test_get_current_data_with_invalid_sql_resets(
         assert "Query syntax error:" in state.error
 
     def test_error_cleared_on_successful_query(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.error = "Previous error"
         state.sql = "SELECT * FROM test_table WHERE age > 25"
         result = state.get_current_data()
         assert len(result) == 2
         assert state.error is None
 
+    def test_get_current_data_without_sql_preserves_existing_error(
+        self, data_source, mock_client, sample_df
+    ):
+        """With no SQL set, reading the data must leave a stored error untouched."""
+        sources = {"test_table": data_source}
+        app_state = AppState(data_sources=sources, client=mock_client)
+        app_state.error = "Previous error"
+        current = app_state.get_current_data()
+        pd.testing.assert_frame_equal(current, sample_df.to_pandas())
+        assert app_state.error == "Previous error"
+
     def test_error_cleared_on_update_dashboard(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.error = "Previous error"
-        state.update_dashboard({"query": "SELECT * FROM test_table", "title": "Test"})
+        state.update_dashboard(
+            {
+                "table": "test_table",
+                "query": "SELECT * FROM test_table",
+                "title": "Test",
+            }
+        )
+        assert state.error is None
+
+    def test_get_current_data_uses_query_executor_for_multi_table_dashboard_sql(
+        self, mock_client
+    ):
+        """Dashboard SQL that joins two tables is run via the query executor."""
+        orders_df = pd.DataFrame({
+            "id": [1, 2, 3],
+            "customer_id": [101, 102, 101],
+            "amount": [100.0, 200.0, 150.0],
+        })
+        customers_df = pd.DataFrame(
+            {"id": [101, 102], "state": ["CA", "NY"]}
+        )
+        chat = QueryChat(orders_df, "orders")
+        chat.add_table(customers_df, "customers")
+
+        # Only orders placed by the California customer (id 101) should remain.
+        california_sql = (
+            "SELECT orders.* "
+            "FROM orders "
+            "JOIN customers ON orders.customer_id = customers.id "
+            "WHERE customers.state = 'CA'"
+        )
+        source_snapshot = dict(chat._data_sources)
+        executor = chat._require_query_executor("test")
+        app_state = AppState(
+            data_sources=source_snapshot,
+            client=mock_client,
+            query_executor=executor,
+        )
+        app_state.update_dashboard(
+            {
+                "table": "orders",
+                "query": california_sql,
+                "title": "California orders",
+            }
+        )
+
+        filtered = app_state.get_current_data()
+
+        assert filtered["id"].tolist() == [1, 3]
+        assert app_state.error is None
 
+    def test_get_current_data_with_invalid_sql_falls_back_to_active_table(
+        self, mock_client
+    ):
+        """A failing query clears sql/title, records an error, keeps the table."""
+        orders_df = pd.DataFrame({
+            "id": [1, 2, 3],
+            "customer_id": [101, 102, 101],
+            "amount": [100.0, 200.0, 150.0],
+        })
+        customers_df = pd.DataFrame(
+            {"id": [101, 102], "state": ["CA", "NY"]}
+        )
+        chat = QueryChat(orders_df, "orders")
+        chat.add_table(customers_df, "customers")
+
+        source_snapshot = dict(chat._data_sources)
+        executor = chat._require_query_executor("test")
+        app_state = AppState(
+            data_sources=source_snapshot,
+            client=mock_client,
+            query_executor=executor,
+        )
+
+        # ``missing_column`` does not exist in customers, so the query fails.
+        broken_update = {
+            "table": "customers",
+            "query": "SELECT missing_column FROM customers",
+            "title": "Broken customer query",
+        }
+        app_state.update_dashboard(broken_update)
+
+        fallback = app_state.get_current_data()
+
+        # The unfiltered customers table is returned instead.
+        assert fallback["id"].tolist() == [101, 102]
+        assert fallback["state"].tolist() == ["CA", "NY"]
+        assert app_state.active_table == "customers"
+        assert app_state.sql is None
+        assert app_state.title is None
+        assert app_state.error is not None
+
     def test_error_cleared_on_reset_dashboard(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.error = "Previous error"
         state.reset_dashboard()
         assert state.error is None
 
     def test_get_display_sql_without_sql(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         assert state.get_display_sql() == "SELECT * FROM test_table"
 
     def test_get_display_sql_with_sql(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.sql = "SELECT name FROM test_table"
         assert state.get_display_sql() == "SELECT name FROM test_table"
 
+    def test_update_dashboard_preserves_other_table_state(self, mock_client):
+        """Updating one table's dashboard keeps the other table's sql/title."""
+        orders_df = pd.DataFrame({"id": [1, 2], "amount": [100.0, 200.0]})
+        customers_df = pd.DataFrame({"id": [101, 102], "state": ["CA", "NY"]})
+        chat = QueryChat(orders_df, "orders")
+        chat.add_table(customers_df, "customers")
+        app_state = AppState(
+            data_sources=dict(chat._data_sources),
+            client=mock_client,
+            query_executor=chat._require_query_executor("test"),
+        )
+        orders_sql = "SELECT * FROM orders WHERE amount > 100"
+        customers_sql = "SELECT * FROM customers WHERE state = 'CA'"
+        # Second update targets customers and must not erase the orders filter.
+        app_state.update_dashboard(
+            {"table": "orders", "query": orders_sql, "title": "Big orders"}
+        )
+        app_state.update_dashboard(
+            {"table": "customers", "query": customers_sql, "title": "CA customers"}
+        )
+
+        orders_state = app_state._table_states["orders"]
+        assert orders_state["sql"] == orders_sql
+        assert orders_state["title"] == "Big orders"
+        assert app_state.active_table == "customers"
+        assert app_state.sql == customers_sql
+
+    def test_to_dict_includes_per_table_states(self, mock_client):
+        """to_dict() reports every table's sql under ``table_states``."""
+        orders_df = pd.DataFrame({"id": [1, 2], "amount": [100.0, 200.0]})
+        customers_df = pd.DataFrame({"id": [101, 102], "state": ["CA", "NY"]})
+        chat = QueryChat(orders_df, "orders")
+        chat.add_table(customers_df, "customers")
+        mock_client.get_turns.return_value = []
+        app_state = AppState(
+            data_sources=dict(chat._data_sources),
+            client=mock_client,
+            query_executor=chat._require_query_executor("test"),
+        )
+        orders_sql = "SELECT * FROM orders WHERE amount > 100"
+        customers_sql = "SELECT * FROM customers WHERE state = 'CA'"
+        app_state.update_dashboard(
+            {"table": "orders", "query": orders_sql, "title": "Big orders"}
+        )
+        app_state.update_dashboard(
+            {"table": "customers", "query": customers_sql, "title": "CA customers"}
+        )
+
+        serialized = app_state.to_dict()
+        assert "table_states" in serialized
+        assert serialized["table_states"]["orders"]["sql"] == orders_sql
+        assert serialized["table_states"]["customers"]["sql"] == customers_sql
+
+    def test_update_from_dict_restores_per_table_states(self, mock_client):
+        """update_from_dict() restores state for the inactive table as well."""
+        orders_df = pd.DataFrame({"id": [1, 2], "amount": [100.0, 200.0]})
+        customers_df = pd.DataFrame({"id": [101, 102], "state": ["CA", "NY"]})
+        chat = QueryChat(orders_df, "orders")
+        chat.add_table(customers_df, "customers")
+        app_state = AppState(
+            data_sources=dict(chat._data_sources),
+            client=mock_client,
+            query_executor=chat._require_query_executor("test"),
+        )
+        orders_sql = "SELECT * FROM orders WHERE amount > 100"
+        customers_sql = "SELECT * FROM customers WHERE state = 'CA'"
+        saved_tables = {
+            "orders": {"sql": orders_sql, "title": "Big orders", "error": None},
+            "customers": {"sql": customers_sql, "title": "CA customers", "error": None},
+        }
+        payload = {
+            "table": "customers",
+            "sql": customers_sql,
+            "title": "CA customers",
+            "error": None,
+            "table_states": saved_tables,
+            "turns": [],
+        }
+        app_state.update_from_dict(payload)
+
+        assert app_state.active_table == "customers"
+        assert app_state.sql == customers_sql
+        assert app_state._table_states["orders"]["sql"] == orders_sql
+        assert app_state._table_states["orders"]["title"] == "Big orders"
+
 
 class TestCreateAppState:
     def test_creates_state_with_callbacks(self, data_source):
@@ -147,21 +341,129 @@ def client_factory(update_callback, reset_callback):
             callback_data["reset_callback"] = reset_callback
             return MagicMock()
 
-        state = create_app_state(data_source, client_factory, greeting="Welcome!")
+        state = create_app_state(
+            data_sources={"test_table": data_source},
+            client_factory=client_factory,
+            greeting="Welcome!",
+        )
         assert state.greeting == "Welcome!"
-        assert state.data_source is data_source
+        assert state.data_sources["test_table"] is data_source
 
         # Test that the update callback works
-        callback_data["update_callback"]({"query": "SELECT 1", "title": "Test"})
+        callback_data["update_callback"](
+            {"table": "test_table", "query": "SELECT 1", "title": "Test"}
+        )
         assert state.sql == "SELECT 1"
         assert state.title == "Test"
 
         # Test that the reset callback works
-        callback_data["reset_callback"]()
+        callback_data["reset_callback"]("test_table")
+        assert state.active_table == "test_table"
         assert state.sql is None
         assert state.title is None
 
 
+class DummyStateAccessor(StateDictQueryChat[pd.DataFrame]):
+    def __init__(self, qc: QueryChat):
+        self._data_sources = dict(qc._data_sources)
+        self._query_executor = qc._require_query_executor("test")
+        self.greeting = None
+
+    def _require_initialized(self, _method_name: str):
+        pass
+
+    def _require_query_executor(self, _method_name: str):
+        return self._query_executor
+
+    def client(self, **_kwargs):
+        return MagicMock()
+
+
+class TestStateDictQueryChat:
+    def test_df_uses_query_executor_for_multi_table_dashboard_sql(self):
+        orders = pd.DataFrame(
+            {
+                "id": [1, 2, 3],
+                "customer_id": [101, 102, 101],
+                "amount": [100.0, 200.0, 150.0],
+            }
+        )
+        customers = pd.DataFrame(
+            {
+                "id": [101, 102],
+                "state": ["CA", "NY"],
+            }
+        )
+        qc = QueryChat(orders, "orders")
+        qc.add_table(customers, "customers")
+        accessor = DummyStateAccessor(qc)
+        sql = (
+            "SELECT orders.* "
+            "FROM orders "
+            "JOIN customers ON orders.customer_id = customers.id "
+            "WHERE customers.state = 'CA'"
+        )
+
+        result = accessor.df(
+            {
+                "table_states": {
+                    "orders": {"sql": sql, "title": "California orders", "error": None},
+                    "customers": {"sql": None, "title": None, "error": None},
+                },
+                "table": "orders",
+                "sql": sql,
+                "title": "California orders",
+                "error": None,
+                "turns": [],
+            },
+            table="orders",
+        )
+
+        assert result["id"].tolist() == [1, 3]
+
+    def test_df_uses_active_table_for_full_data_and_error_fallback(self):
+        orders = pd.DataFrame(
+            {
+                "id": [1, 2, 3],
+                "customer_id": [101, 102, 101],
+                "amount": [100.0, 200.0, 150.0],
+            }
+        )
+        customers = pd.DataFrame(
+            {
+                "id": [101, 102],
+                "state": ["CA", "NY"],
+            }
+        )
+        qc = QueryChat(orders, "orders")
+        qc.add_table(customers, "customers")
+        accessor = DummyStateAccessor(qc)
+
+        full_result = accessor.df(
+            {
+                "table": "customers",
+                "sql": None,
+                "title": None,
+                "error": None,
+                "turns": [],
+            },
+            table="customers",
+        )
+        error_result = accessor.df(
+            {
+                "table": "customers",
+                "sql": "SELECT missing_column FROM customers",
+                "title": "Broken customer query",
+                "error": None,
+                "turns": [],
+            },
+            table="customers",
+        )
+
+        assert full_result["id"].tolist() == [101, 102]
+        assert error_result["id"].tolist() == [101, 102]
+
+
 class TestStreamResponse:
     def test_stream_response_yields_strings(self):
         mock_client = MagicMock()
@@ -217,7 +519,7 @@ def failing_generator():
 class TestGetDisplayMessages:
     def test_empty_turns(self, data_source, mock_client):
         mock_client.get_turns.return_value = []
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         assert state.get_display_messages() == []
 
     def test_user_message(self, data_source, mock_client):
@@ -225,7 +527,7 @@ def test_user_message(self, data_source, mock_client):
 
         user_turn = Turn(role="user", contents="Hello world")
         mock_client.get_turns.return_value = [user_turn]
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         messages = state.get_display_messages()
         assert len(messages) == 1
         assert messages[0] == {"role": "user", "content": "Hello world"}
@@ -235,7 +537,7 @@ def test_assistant_message(self, data_source, mock_client):
 
         assistant_turn = Turn(role="assistant", contents="Hi there!")
         mock_client.get_turns.return_value = [assistant_turn]
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         messages = state.get_display_messages()
         assert len(messages) == 1
         assert messages[0] == {"role": "assistant", "content": "Hi there!"}
@@ -248,7 +550,7 @@ def test_multiple_messages(self, data_source, mock_client):
             Turn(role="assistant", contents="Answer"),
         ]
         mock_client.get_turns.return_value = turns
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         messages = state.get_display_messages()
         assert len(messages) == 2
         assert messages[0] == {"role": "user", "content": "Question"}
@@ -260,6 +562,7 @@ def test_app_state_dict_structure(self):
         from querychat._querychat_core import AppStateDict
 
         state: AppStateDict = {
+            "table": "test",
             "sql": "SELECT * FROM test",
             "title": "Test",
             "error": None,
@@ -279,12 +582,13 @@ def test_to_dict_includes_turns(self, data_source, mock_client):
         assistant_turn = Turn(role="assistant", contents="Hi!")
         mock_client.get_turns.return_value = [user_turn, assistant_turn]
 
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         state.sql = "SELECT * FROM test"
         state.title = "Test"
 
         result = state.to_dict()
 
+        assert result["table"] == "test_table"
         assert result["sql"] == "SELECT * FROM test"
         assert result["title"] == "Test"
         assert "turns" in result
@@ -295,17 +599,18 @@ def test_to_dict_includes_turns(self, data_source, mock_client):
 
     def test_to_dict_empty_turns(self, data_source, mock_client):
         mock_client.get_turns.return_value = []
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
         result = state.to_dict()
         assert result["turns"] == []
 
 
 class TestAppStateDeserialization:
     def test_update_from_dict_restores_turns(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
 
         state.update_from_dict(
             {
+                "table": "test_table",
                 "sql": "SELECT name FROM test",
                 "title": "Names Only",
                 "error": None,
@@ -324,6 +629,7 @@ def test_update_from_dict_restores_turns(self, data_source, mock_client):
             }
         )
 
+        assert state.active_table == "test_table"
         assert state.sql == "SELECT name FROM test"
         assert state.title == "Names Only"
         mock_client.set_turns.assert_called_once()
@@ -333,6 +639,14 @@ def test_update_from_dict_restores_turns(self, data_source, mock_client):
         assert turns_arg[1].role == "assistant"
 
     def test_update_from_dict_empty_turns(self, data_source, mock_client):
-        state = AppState(data_source=data_source, client=mock_client)
-        state.update_from_dict({"sql": None, "title": None, "error": None, "turns": []})
+        state = AppState(data_sources={"test_table": data_source}, client=mock_client)
+        state.update_from_dict(
+            {
+                "table": "test_table",
+                "sql": None,
+                "title": None,
+                "error": None,
+                "turns": [],
+            }
+        )
         mock_client.set_turns.assert_called_with([])
diff --git a/pkg-py/tests/test_system_prompt.py b/pkg-py/tests/test_system_prompt.py
index 976362045..db036869e 100644
--- a/pkg-py/tests/test_system_prompt.py
+++ b/pkg-py/tests/test_system_prompt.py
@@ -5,7 +5,9 @@
 
 import narwhals.stable.v1 as nw
 import pandas as pd
+import polars as pl
 import pytest
+from querychat._data_dict import DataDict, RelationshipSpec, TableSpec
 from querychat._datasource import DataFrameSource
 from querychat._system_prompt import QueryChatSystemPrompt
 
@@ -29,7 +31,7 @@ def sample_data_source():
 def sample_prompt_template():
     """Create a sample prompt template for testing."""
     return """Database Type: {{db_type}}
-Schema: {{schema}}
+Tables: {{{tables_overview}}}
 {{#data_description}}Data: {{data_description}}{{/data_description}}
 {{#extra_instructions}}Instructions: {{extra_instructions}}{{/extra_instructions}}
 {{#has_tool_update}}UPDATE TOOL ENABLED{{/has_tool_update}}
@@ -38,6 +40,80 @@ def sample_prompt_template():
 """
 
 
+def _make_system_prompt(
+    data_sources: dict,
+    data_dicts: list[DataDict] | None = None,
+    **kwargs,
+) -> QueryChatSystemPrompt:
+    return QueryChatSystemPrompt(
+        prompt_template=None,
+        data_sources=data_sources,
+        data_dicts=data_dicts or [],
+        **kwargs,
+    )
+
+
+def test_system_prompt_contains_table_names(sample_data_source) -> None:
+    sp = _make_system_prompt({"mytable": sample_data_source})
+    rendered = sp.render({"query"})
+    assert "mytable" in rendered
+
+
+def test_system_prompt_no_schema_block(sample_data_source) -> None:
+    sp = _make_system_prompt({"mytable": sample_data_source})
+    rendered = sp.render({"query"})
+    # Schema block should be gone — no "Columns:" section in prompt
+    assert "Columns:" not in rendered
+
+
+def test_system_prompt_includes_table_description() -> None:
+    df = nw.from_native(pl.DataFrame({"x": [1]}))
+    source = DataFrameSource(df, "orders")
+    dd = DataDict(
+        tables={"orders": TableSpec(description="Order records.")},
+    )
+    sp = _make_system_prompt({"orders": source}, data_dicts=[dd])
+    rendered = sp.render({"query"})
+    assert "Order records." in rendered
+
+
+def test_system_prompt_includes_glossary() -> None:
+    df = nw.from_native(pl.DataFrame({"x": [1]}))
+    source = DataFrameSource(df, "orders")
+    dd = DataDict(
+        tables={"orders": TableSpec(columns=[])},
+        glossary={"churn": "No orders in 90 days."},
+    )
+    sp = _make_system_prompt({"orders": source}, data_dicts=[dd])
+    rendered = sp.render({"query"})
+    assert "churn" in rendered
+    assert "No orders in 90 days." in rendered
+
+
+def test_system_prompt_includes_relationships() -> None:
+    df = nw.from_native(pl.DataFrame({"x": [1]}))
+    source = DataFrameSource(df, "orders")
+    dd = DataDict(
+        tables={"orders": TableSpec(columns=[])},
+        relationships=[
+            RelationshipSpec(
+                join="orders.customer_id = customers.id",
+                cardinality="many-to-one",
+                description="Order placed by customer.",
+            )
+        ],
+    )
+    sp = _make_system_prompt({"orders": source}, data_dicts=[dd])
+    rendered = sp.render({"query"})
+    assert "orders.customer_id = customers.id" in rendered
+
+
+def test_system_prompt_no_glossary_section_when_empty(sample_data_source) -> None:
+    sp = _make_system_prompt({"t": sample_data_source})
+    rendered = sp.render({"query"})
+    assert "<glossary>" not in rendered
+
+
 class TestQueryChatSystemPromptInit:
     """Tests for QueryChatSystemPrompt initialization."""
 
@@ -54,8 +130,7 @@ def test_init_with_string_template(
         assert prompt.data_source == sample_data_source
         assert prompt.data_description is None
         assert prompt.extra_instructions is None
-        assert prompt.schema is not None
-        assert prompt.categorical_threshold == 10
+        assert prompt.categorical_threshold == 20
 
     def test_init_with_path_template(self, sample_data_source):
         """Test initialization with Path template."""
@@ -164,7 +239,7 @@ def test_render_with_both_tools(self, sample_data_source, sample_prompt_template
         assert "QUERY TOOL ENABLED" in rendered
         assert "QUERY GUIDELINES" in rendered
         assert "Database Type:" in rendered
-        assert "Schema:" in rendered
+        assert "Tables:" in rendered
 
     def test_render_with_query_only(self, sample_data_source, sample_prompt_template):
         """Test rendering with only query tool enabled."""
@@ -233,8 +308,10 @@ def test_render_includes_extra_instructions(
 
         assert "Instructions: Be very concise" in rendered
 
-    def test_render_includes_schema(self, sample_data_source, sample_prompt_template):
-        """Test that rendering includes schema information."""
+    def test_render_includes_table_name(
+        self, sample_data_source, sample_prompt_template
+    ):
+        """Test that rendering includes the table name in the overview."""
         prompt = QueryChatSystemPrompt(
             prompt_template=sample_prompt_template,
             data_source=sample_data_source,
@@ -242,9 +319,8 @@ def test_render_includes_schema(self, sample_data_source, sample_prompt_template
 
         rendered = prompt.render(tools=("query",))
 
-        assert "Schema:" in rendered
-        # Schema should contain table information
-        assert prompt.schema in rendered
+        assert "Tables:" in rendered
+        assert "test_table" in rendered
 
     def test_render_includes_db_type(self, sample_data_source, sample_prompt_template):
         """Test that rendering includes database type."""
@@ -259,47 +335,6 @@ def test_render_includes_db_type(self, sample_data_source, sample_prompt_templat
         assert sample_data_source.get_db_type() in rendered
 
 
-class TestSchemaInferenceSkip:
-    """Tests that schema inference is skipped when template doesn't reference {{schema}}."""
-
-    def test_schema_skipped_when_not_in_template(self, sample_data_source):
-        """Schema should be empty string when template doesn't use {{schema}}."""
-        prompt = QueryChatSystemPrompt(
-            prompt_template="No schema here: {{db_type}}",
-            data_source=sample_data_source,
-        )
-
-        assert prompt.schema == ""
-
-    def test_schema_computed_when_in_template(self, sample_data_source):
-        """Schema should be computed when template uses {{schema}}."""
-        prompt = QueryChatSystemPrompt(
-            prompt_template="Schema: {{schema}}",
-            data_source=sample_data_source,
-        )
-
-        assert prompt.schema != ""
-        assert "test_table" in prompt.schema
-
-    def test_schema_computed_for_triple_braces(self, sample_data_source):
-        """Schema should be computed for unescaped {{{schema}}} syntax."""
-        prompt = QueryChatSystemPrompt(
-            prompt_template="Schema: {{{schema}}}",
-            data_source=sample_data_source,
-        )
-
-        assert prompt.schema != ""
-
-    def test_schema_computed_for_conditional_section(self, sample_data_source):
-        """Schema should be computed for {{#schema}} conditional sections."""
-        prompt = QueryChatSystemPrompt(
-            prompt_template="{{#schema}}Has schema{{/schema}}",
-            data_source=sample_data_source,
-        )
-
-        assert prompt.schema != ""
-
-
 class TestVizPromptConditionals:
     """Tests for visualization-related conditional rendering in the real prompt."""
 
@@ -310,8 +345,6 @@ def test_graceful_recovery_fallback_excluded_without_query_tool(
         When only visualize is enabled (no query tool), the fallback
         to querychat_query should not appear in the rendered prompt.
         """
-        from pathlib import Path
-
         template_path = (
             Path(__file__).parent.parent
             / "src"
@@ -335,8 +368,6 @@ def test_collapsed_guidance_included_with_both_tools(
         When both query and visualize are enabled, the collapsed query
         guidance should appear in the system prompt.
         """
-        from pathlib import Path
-
         template_path = (
             Path(__file__).parent.parent
             / "src"
@@ -359,8 +390,6 @@ def test_viz_only_has_no_cannot_query_message(self, sample_data_source):
         should NOT contain "cannot query or analyze" and SHOULD contain
         "Visualizing Data".
         """
-        from pathlib import Path
-
         template_path = (
             Path(__file__).parent.parent
             / "src"
@@ -383,8 +412,6 @@ def test_collapsed_guidance_only_with_both_tools(self, sample_data_source):
         The "Avoid redundant expanded results" guidance should only appear
         when both query and visualize are enabled.
         """
-        from pathlib import Path
-
         template_path = (
             Path(__file__).parent.parent
             / "src"
@@ -404,3 +431,93 @@ def test_collapsed_guidance_only_with_both_tools(self, sample_data_source):
         assert "Avoid redundant expanded results" in rendered_both
         assert "Avoid redundant expanded results" not in rendered_query_only
         assert "Avoid redundant expanded results" not in rendered_viz_only
+
+
+class TestDataDictYamlRendering:
+    """Tests for YAML-based data dict rendering in the system prompt."""
+
+    def _make_source(self, table_name: str) -> DataFrameSource:
+        df = nw.from_native(pl.DataFrame({"x": [1]}))
+        return DataFrameSource(df, table_name)
+
+    def test_no_dict_renders_flat_tables_block(self) -> None:
+        sp = _make_system_prompt({"mytable": self._make_source("mytable")})
+        rendered = sp.render({"query"})
+        assert "<tables>" in rendered
+        assert "<data-dict" not in rendered
+
+    def test_single_dict_renders_xml_tag_with_name(self) -> None:
+        dd = DataDict(name="sales", tables={"orders": TableSpec(description="Orders.")})
+        sp = _make_system_prompt(
+            {"orders": self._make_source("orders")}, data_dicts=[dd]
+        )
+        rendered = sp.render({"query"})
+        assert '<data-dict name="sales">' in rendered
+        assert "Orders." in rendered
+
+    def test_xml_tag_includes_description_attribute(self) -> None:
+        dd = DataDict(name="sales", description="Sales domain data", tables={})
+        sp = _make_system_prompt(
+            {"orders": self._make_source("orders")}, data_dicts=[dd]
+        )
+        rendered = sp.render({"query"})
+        assert 'description="Sales domain data"' in rendered
+
+    def test_xml_tag_omits_description_when_absent(self) -> None:
+        dd = DataDict(name="sales", tables={})
+        sp = _make_system_prompt(
+            {"orders": self._make_source("orders")}, data_dicts=[dd]
+        )
+        rendered = sp.render({"query"})
+        assert "description=" not in rendered
+
+    def test_yaml_body_excludes_name_and_description(self) -> None:
+        dd = DataDict(name="sales", description="Sales domain data", tables={})
+        sp = _make_system_prompt(
+            {"orders": self._make_source("orders")}, data_dicts=[dd]
+        )
+        rendered = sp.render({"query"})
+        # name and description belong in the XML tag, not the YAML body
+        assert "name: sales" not in rendered
+        assert "description: Sales domain data" not in rendered
+
+    def test_yaml_body_includes_tables_relationships_glossary(self) -> None:
+        dd = DataDict(
+            name="sales",
+            tables={"orders": TableSpec(description="Order records.")},
+            relationships=[RelationshipSpec(join="orders.customer_id = customers.id")],
+            glossary={"churn": "No orders in 90 days."},
+        )
+        sp = _make_system_prompt(
+            {"orders": self._make_source("orders")}, data_dicts=[dd]
+        )
+        rendered = sp.render({"query"})
+        assert "orders.customer_id = customers.id" in rendered
+        assert "churn" in rendered
+        assert "Order records." in rendered
+
+    def test_multiple_dicts_render_sibling_xml_tags(self) -> None:
+        dd1 = DataDict(name="sales", tables={"orders": TableSpec(description="Orders")})
+        dd2 = DataDict(
+            name="catalog", tables={"products": TableSpec(description="Products")}
+        )
+        sp = _make_system_prompt(
+            {
+                "orders": self._make_source("orders"),
+                "products": self._make_source("products"),
+            },
+            data_dicts=[dd1, dd2],
+        )
+        rendered = sp.render({"query"})
+        assert '<data-dict name="sales">' in rendered
+        assert '<data-dict name="catalog">' in rendered
+        assert rendered.count("<data-dict") == 2
+
+    def test_multi_table_no_dict_emits_warning(self) -> None:
+        with pytest.warns(UserWarning, match="data_dict"):
+            _make_system_prompt(
+                {
+                    "orders": self._make_source("orders"),
+                    "products": self._make_source("products"),
+                }
+            )
diff --git a/pkg-py/tests/test_tools.py b/pkg-py/tests/test_tools.py
index baacb68ff..e7d631477 100644
--- a/pkg-py/tests/test_tools.py
+++ b/pkg-py/tests/test_tools.py
@@ -1,13 +1,25 @@
 """Tests for tool functions and utilities."""
 
+import html as html_module
 import warnings
 
 import narwhals.stable.v1 as nw
 import pandas as pd
+import polars as pl
 import pytest
+from htmltools import TagList
+from querychat._data_dict import ColumnRange, ColumnSpec, DataDict, TableSpec
 from querychat._datasource import DataFrameSource
+from querychat._query_executor import DataSourceExecutor
 from querychat._utils import querychat_tool_starts_open
-from querychat.tools import _query_impl
+from querychat.tools import (
+    GetSchemaResult,
+    UpdateDashboardData,
+    _get_schema_impl,
+    _query_impl,
+    tool_reset_dashboard,
+)
+from shinychat import message_content_chunk
 
 
 @pytest.fixture
@@ -16,36 +28,41 @@ def data_source():
     return DataFrameSource(df, "test_table")
 
 
+@pytest.fixture
+def executor(data_source):
+    return DataSourceExecutor({"test_table": data_source})
+
+
 class TestQueryCollapsedParameter:
     """Tests for the query tool's collapsed parameter."""
 
-    def test_collapsed_true_sets_open_false(self, data_source, monkeypatch):
+    def test_collapsed_true_sets_open_false(self, executor, monkeypatch):
         monkeypatch.delenv("QUERYCHAT_TOOL_DETAILS", raising=False)
-        query_fn = _query_impl(data_source)
+        query_fn = _query_impl(executor)
         result = query_fn("SELECT * FROM test_table", collapsed=True)
         assert result.extra["display"].open is False
 
-    def test_collapsed_false_sets_open_true(self, data_source, monkeypatch):
+    def test_collapsed_false_sets_open_true(self, executor, monkeypatch):
         monkeypatch.delenv("QUERYCHAT_TOOL_DETAILS", raising=False)
-        query_fn = _query_impl(data_source)
+        query_fn = _query_impl(executor)
         result = query_fn("SELECT * FROM test_table", collapsed=False)
         assert result.extra["display"].open is True
 
-    def test_collapsed_none_falls_back_to_default(self, data_source, monkeypatch):
+    def test_collapsed_none_falls_back_to_default(self, executor, monkeypatch):
         monkeypatch.delenv("QUERYCHAT_TOOL_DETAILS", raising=False)
-        query_fn = _query_impl(data_source)
+        query_fn = _query_impl(executor)
         result = query_fn("SELECT * FROM test_table")
         assert result.extra["display"].open is False  # default for query
 
-    def test_collapsed_overrides_env_expanded(self, data_source, monkeypatch):
+    def test_collapsed_overrides_env_expanded(self, executor, monkeypatch):
         monkeypatch.setenv("QUERYCHAT_TOOL_DETAILS", "expanded")
-        query_fn = _query_impl(data_source)
+        query_fn = _query_impl(executor)
         result = query_fn("SELECT * FROM test_table", collapsed=True)
         assert result.extra["display"].open is False
 
-    def test_collapsed_overrides_env_collapsed(self, data_source, monkeypatch):
+    def test_collapsed_overrides_env_collapsed(self, executor, monkeypatch):
         monkeypatch.setenv("QUERYCHAT_TOOL_DETAILS", "collapsed")
-        query_fn = _query_impl(data_source)
+        query_fn = _query_impl(executor)
         result = query_fn("SELECT * FROM test_table", collapsed=False)
         assert result.extra["display"].open is True
 
@@ -113,3 +130,125 @@ def test_querychat_tool_starts_open_invalid_setting(monkeypatch):
         assert len(w) == 1
         assert "Invalid value" in str(w[0].message)
         assert result is False  # Falls back to default behavior
+
+
+def test_update_dashboard_data_has_table_field():
+    """Test that UpdateDashboardData includes table field."""
+    # TypedDict should have table as a key
+    assert "table" in UpdateDashboardData.__annotations__
+
+
+def test_reset_dashboard_accepts_table_parameter():
+    """Test that reset_dashboard tool accepts table parameter."""
+    reset_tables = []
+
+    def callback(table: str):
+        reset_tables.append(table)
+
+    tool = tool_reset_dashboard(callback, ["orders"])
+
+    # The tool function should accept table parameter
+    tool.func(table="orders")
+
+    assert reset_tables == ["orders"]
+
+
+def test_reset_dashboard_rejects_unknown_table():
+    """Reset dashboard should fail fast for an unknown table name."""
+    reset_tables = []
+
+    def callback(table: str):
+        reset_tables.append(table)
+
+    tool = tool_reset_dashboard(callback, ["orders"])
+
+    result = tool.func(table="customers")
+
+    assert reset_tables == []
+    assert result.error is not None
+    assert "Table 'customers' not found" in str(result.error)
+
+
+def test_reset_dashboard_without_table_names_preserves_legacy_signature():
+    """Public helper should still work without passing table_names."""
+    reset_tables = []
+
+    def callback(table: str):
+        reset_tables.append(table)
+
+    tool = tool_reset_dashboard(callback)
+
+    tool.func(table="customers")
+
+    assert reset_tables == ["customers"]
+
+
+def _make_executor_and_table(
+    df: pl.DataFrame, table_name: str
+) -> tuple[DataSourceExecutor, list[str]]:
+    source = DataFrameSource(nw.from_native(df), table_name)
+    executor = DataSourceExecutor({table_name: source})
+    return executor, [table_name]
+
+
+def test_get_schema_impl_with_data_dict() -> None:
+    dd = DataDict(
+        tables={
+            "orders": TableSpec(
+                columns=[ColumnSpec(name="amount", range=ColumnRange(min=0, max=100))]
+            )
+        },
+    )
+    df = pl.DataFrame({"amount": [10, 20]})
+    executor, table_names = _make_executor_and_table(df, "orders")
+    fn = _get_schema_impl([dd], executor, table_names, categorical_threshold=10)
+    result = fn("orders")
+    assert "amount" in str(result.value)
+    assert "Range: 0 to 100" in str(result.value)
+
+
+def test_get_schema_impl_without_data_dict() -> None:
+    df = pl.DataFrame({"amount": [10, 20, 30]})
+    executor, table_names = _make_executor_and_table(df, "orders")
+    fn = _get_schema_impl([], executor, table_names, categorical_threshold=10)
+    result = fn("orders")
+    assert "amount" in str(result.value)
+
+
+def test_get_schema_impl_unknown_table_returns_error() -> None:
+    df = pl.DataFrame({"amount": [1]})
+    executor, table_names = _make_executor_and_table(df, "orders")
+    fn = _get_schema_impl([], executor, table_names, categorical_threshold=10)
+    result = fn("nonexistent")
+    assert result.error is not None
+    assert "nonexistent" in str(result.error)
+
+
+def test_get_schema_result_sentinel_has_data_attributes():
+    result = GetSchemaResult(
+        value="Table: orders\nColumns:\n- id (INTEGER)",
+        table_name="orders",
+    )
+    msg = message_content_chunk(result)
+    # msg.content is a pre-rendered HTML string; wrap in TagList to render again
+    rendered = TagList(msg.content).render()
+    html = rendered["html"]
+    assert "qc-schema-collector" in html
+    assert 'data-table="orders"' in html
+    assert "display:none" in html
+
+
+def test_get_schema_result_sentinel_embeds_schema():
+    schema = "Table: orders\nColumns:\n- id (INTEGER)"
+    result = GetSchemaResult(value=schema, table_name="orders")
+    msg = message_content_chunk(result)
+    # ChatMessage pre-renders TagList to a string; unescape HTML entities to check schema
+    assert schema in html_module.unescape(msg.content)
+
+
+def test_get_schema_result_includes_js_dependency():
+    result = GetSchemaResult(value="Table: t\nColumns:\n- x (TEXT)", table_name="t")
+    msg = message_content_chunk(result)
+    # ChatMessage extracts HTMLDependency objects into html_deps
+    dep_names = [d.name for d in msg.html_deps]
+    assert "querychat-schema-display" in dep_names
diff --git a/pkg-py/tests/test_viz_tools.py b/pkg-py/tests/test_viz_tools.py
index 5d9c2db32..98d31e5c2 100644
--- a/pkg-py/tests/test_viz_tools.py
+++ b/pkg-py/tests/test_viz_tools.py
@@ -79,11 +79,11 @@ def test_ggsql_syntax_reference_does_not_repeat_charts_vs_tables_note():
 
 def test_main_prompt_render_includes_ggsql_reference(data_source):
     system_prompt = QueryChatSystemPrompt(
-        PROMPTS_DIR / "prompt.md",
+        prompt_template=PROMPTS_DIR / "prompt.md",
         data_source=data_source,
     )
 
-    prompt = system_prompt.render(("visualize",))
+    prompt = system_prompt.render({"visualize"})
 
     assert "querychat_visualize" in prompt
     assert "## ggsql Syntax Reference" in prompt
diff --git a/pkg-r/DESCRIPTION b/pkg-r/DESCRIPTION
index 2d10232b8..577e6a9c1 100644
--- a/pkg-r/DESCRIPTION
+++ b/pkg-r/DESCRIPTION
@@ -28,15 +28,17 @@ Imports:
     DBI,
     ellmer (>= 0.4.1),
     htmltools,
+    jsonlite,
     lifecycle,
     promises,
     R6,
     rlang (>= 1.1.0),
     S7,
     shiny,
-    shinychat (>= 0.4.0),
+    shinychat (> 0.4.0),
     utils,
-    whisker
+    whisker,
+    yaml
 Suggests:
     dbplyr,
     dplyr,
@@ -56,6 +58,8 @@ Suggests:
     withr
 VignetteBuilder:
     knitr
+Remotes:
+    posit-dev/shinychat/pkg-r
 Config/roxygen2/version: 8.0.0
 Config/testthat/edition: 3
 Config/testthat/parallel: true
diff --git a/pkg-r/NAMESPACE b/pkg-r/NAMESPACE
index 114c3c3ef..4361f3516 100644
--- a/pkg-r/NAMESPACE
+++ b/pkg-r/NAMESPACE
@@ -5,6 +5,7 @@ export(DataFrameSource)
 export(DataSource)
 export(PinSource)
 export(QueryChat)
+export(TableAccessor)
 export(TblSqlSource)
 export(querychat)
 export(querychat_app)
@@ -19,3 +20,4 @@ import(rlang)
 importFrom(R6,R6Class)
 importFrom(bslib,sidebar)
 importFrom(lifecycle,deprecated)
+importFrom(shinychat,contents_shinychat)
diff --git a/pkg-r/NEWS.md b/pkg-r/NEWS.md
index 5977f921f..199af36c9 100644
--- a/pkg-r/NEWS.md
+++ b/pkg-r/NEWS.md
@@ -2,14 +2,37 @@
 
 ## New features
 
+* `QueryChat$new()` now supports **multiple related tables**. Register additional tables with `$add_table()` and the LLM can reason across all of them — joins, cross-table filters, aggregations. Per-table reactive state (`$df()`, `$sql()`, `$title()`) is accessible via `qc_vals$table("name")` on the list returned by `$server()`. (#195)
+
+  ```r
+  qc <- QueryChat$new(orders_df, "orders")
+  qc$add_table(customers_df, "customers")
+
+  qc_vals <- qc$server()
+  qc_vals$table("orders")$df()
+  qc_vals$table("customers")$sql()
+  ```
+
+* A new **`data_dict`** parameter — integrating with the [data-dict](https://data-dict.tidyverse.org/) spec — lets you annotate tables and columns with plain-English descriptions loaded from a YAML file. This is the preferred way to provide additional context for the data, especially when multiple tables are relevant. The LLM receives these descriptions when it fetches the schema, helping it interpret ambiguous or domain-specific column names without any extra prompting. (#195)
+
+  ```r
+  QueryChat$new(orders_df, "orders", data_dict = "data_dict.yaml")
+  ```
+
 * Added `PinSource`, a data source for chatting with datasets pinned to a [pins](https://pins.rstudio.com/) board. Works with parquet, CSV, JSON, and RDS pins, and uses the pin's title, description, and tags as the default data description. (#246)
 
 * File attachments are now enabled by default in the Shiny chat UI. Users can attach images, PDFs, and text files to their messages and the LLM will receive them. Disable with `allow_attachments = FALSE` in `mod_ui()` or `QueryChat$ui()`. (#253)
 
+## Breaking changes
+
+* The `$data_source` property has been removed. Use `qc$table("name")$data_source` to read a table's data source, and `qc$add_table(df, "name", replace = TRUE)` to replace it. The `data_source` parameter to `$server()` has also been removed; call `$add_table()` before `$server()` instead. (#195)
+
 ## Improvements
 
 * Chat greetings now use shinychat's greeting API (requires shinychat >= 0.4.0). A provided `greeting` renders instantly when the app loads, and when no `greeting` is given one is generated on demand without being added to the conversation history. Generated greetings are now preserved across bookmark/restore. (#249)
 
+* The system prompt is now lighter: full schema is no longer embedded upfront. Instead the LLM fetches per-table schema on demand via the new `querychat_get_schema` tool — and only when it needs to. When a `data_dict` is provided, the tool skips columns that already have descriptions, so the LLM only pays for what isn't already documented. (#195)
+
 # querychat 0.3.0
 
 ## New features
diff --git a/pkg-r/R/DBISource.R b/pkg-r/R/DBISource.R
index ee5ca4521..725c02d8c 100644
--- a/pkg-r/R/DBISource.R
+++ b/pkg-r/R/DBISource.R
@@ -58,10 +58,12 @@ DBISource <- R6::R6Class(
 
       # Check if table exists
       if (!DBI::dbExistsTable(conn, table_name)) {
-        cli::cli_abort(c(
-          "Table {.val {DBI::dbQuoteIdentifier(conn, table_name)}} not found in database",
-          "i" = "If you're using a table in a catalog or schema, pass a {.fn DBI::Id} object to {.arg table_name}"
-        ))
+        cli::cli_abort(
+          c(
+            "Table {.val {DBI::dbQuoteIdentifier(conn, table_name)}} not found in database",
+            "i" = "If you're using a table in a catalog or schema, pass a {.fn DBI::Id} object to {.arg table_name}"
+          )
+        )
       }
 
       private$conn <- conn
@@ -69,13 +71,15 @@ DBISource <- R6::R6Class(
 
       # Store original column names for validation
       # Use WHERE 1=0 instead of LIMIT 0 for SQL Server compatibility
-      private$colnames <- colnames(DBI::dbGetQuery(
-        conn,
-        sprintf(
-          "SELECT * FROM %s WHERE 1=0",
-          DBI::dbQuoteIdentifier(conn, table_name)
+      private$colnames <- colnames(
+        DBI::dbGetQuery(
+          conn,
+          sprintf(
+            "SELECT * FROM %s WHERE 1=0",
+            DBI::dbQuoteIdentifier(conn, table_name)
+          )
         )
-      ))
+      )
     },
 
     #' @description Get the database type
@@ -103,9 +107,34 @@ DBISource <- R6::R6Class(
     #' @param categorical_threshold Maximum number of unique values for a text
     #'   column to be considered categorical (default: 20)
     #' @return A string describing the schema
-    get_schema = function(categorical_threshold = 20) {
+    get_schema = function(categorical_threshold = 20, table_spec = NULL) {
       check_number_whole(categorical_threshold, min = 1)
-      get_schema_impl(private$conn, self$table_name, categorical_threshold)
+      get_schema_impl(
+        private$conn,
+        self$table_name,
+        categorical_threshold,
+        table_spec = table_spec
+      )
+    },
+
+    get_schema_result = function(
+      categorical_threshold = 20,
+      table_spec = NULL
+    ) {
+      check_number_whole(categorical_threshold, min = 1)
+      details <- build_column_details_impl(
+        private$conn,
+        self$table_name,
+        categorical_threshold,
+        table_spec = table_spec
+      )
+      list(
+        text = format_schema_from_details(
+          as.character(DBI::dbQuoteIdentifier(private$conn, self$table_name)),
+          details
+        ),
+        columns = details
+      )
     },
 
     #' @description
@@ -196,30 +225,29 @@ DBISource <- R6::R6Class(
   )
 )
 
-
-get_schema_impl <- function(
+# Returns a list of named lists (one per column) with all schema metadata.
+# Used by both format_schema_from_details() (LLM text) and JSON serialization (UI).
+build_column_details_impl <- function(
   conn,
   table_name,
   categorical_threshold = 20,
   columns = NULL,
-  prep_query = identity
+  prep_query = identity,
+  table_spec = NULL
 ) {
   check_function(prep_query)
 
-  # Get column information
-  columns <- columns %||% DBI::dbListFields(conn, table_name)
+  documented <- list()
+  for (spec in table_spec[["columns"]] %||% list()) {
+    documented[[spec[["name"]]]] <- spec
+  }
 
-  schema_lines <- c(
-    paste("Table:", DBI::dbQuoteIdentifier(conn, table_name)),
-    "Columns:"
-  )
+  columns <- columns %||% DBI::dbListFields(conn, table_name)
 
-  # Build single query to get column statistics
   select_parts <- character(0)
   numeric_columns <- character(0)
   text_columns <- character(0)
 
-  # Get sample of data to determine types
   # Use dbFetch(n=1) instead of LIMIT 1 for SQL Server compatibility
   sample_query <- paste0(
     "SELECT * FROM ",
@@ -230,6 +258,7 @@ get_schema_impl <- function(
   DBI::dbClearResult(rs)
 
   for (col in columns) {
+    spec <- documented[[col]]
     col_class <- class(sample_data[[col]])[1]
 
     if (
@@ -237,36 +266,39 @@ get_schema_impl <- function(
         c("integer", "numeric", "double", "Date", "POSIXct", "POSIXt")
     ) {
       numeric_columns <- c(numeric_columns, col)
-      select_parts <- c(
-        select_parts,
-        paste0(
-          "MIN(",
-          DBI::dbQuoteIdentifier(conn, col),
-          ") as ",
-          DBI::dbQuoteIdentifier(conn, paste0(col, '__min'))
-        ),
-        paste0(
-          "MAX(",
-          DBI::dbQuoteIdentifier(conn, col),
-          ") as ",
-          DBI::dbQuoteIdentifier(conn, paste0(col, '__max'))
+      if (is.null(spec[["range"]])) {
+        select_parts <- c(
+          select_parts,
+          paste0(
+            "MIN(",
+            DBI::dbQuoteIdentifier(conn, col),
+            ") as ",
+            DBI::dbQuoteIdentifier(conn, paste0(col, "__min"))
+          ),
+          paste0(
+            "MAX(",
+            DBI::dbQuoteIdentifier(conn, col),
+            ") as ",
+            DBI::dbQuoteIdentifier(conn, paste0(col, "__max"))
+          )
         )
-      )
+      }
     } else if (col_class %in% c("character", "factor")) {
       text_columns <- c(text_columns, col)
-      select_parts <- c(
-        select_parts,
-        paste0(
-          "COUNT(DISTINCT ",
-          DBI::dbQuoteIdentifier(conn, col),
-          ") as ",
-          DBI::dbQuoteIdentifier(conn, paste0(col, '__distinct_count'))
+      if (is.null(spec[["values"]])) {
+        select_parts <- c(
+          select_parts,
+          paste0(
+            "COUNT(DISTINCT ",
+            DBI::dbQuoteIdentifier(conn, col),
+            ") as ",
+            DBI::dbQuoteIdentifier(conn, paste0(col, "__distinct_count"))
+          )
         )
-      )
+      }
     }
   }
 
-  # Execute statistics query
   column_stats <- list()
   if (length(select_parts) > 0) {
     tryCatch(
@@ -278,21 +310,18 @@ get_schema_impl <- function(
           DBI::dbQuoteIdentifier(conn, table_name)
         )
         result <- DBI::dbGetQuery(conn, prep_query(stats_query))
-        if (nrow(result) > 0) {
-          column_stats <- as.list(result[1, ])
-        }
+        if (nrow(result) > 0) column_stats <- as.list(result[1, ])
       },
-      error = function(e) {
-        # Fall back to no statistics if query fails
-      }
+      error = function(e) {}
     )
   }
 
-  # Get categorical values for text columns below threshold
   categorical_values <- list()
   text_cols_to_query <- character(0)
-
   for (col_name in text_columns) {
+    if (!is.null(documented[[col_name]][["values"]])) {
+      next
+    }
     distinct_count_key <- paste0(col_name, "__distinct_count")
     if (
       distinct_count_key %in%
@@ -303,11 +332,7 @@ get_schema_impl <- function(
       text_cols_to_query <- c(text_cols_to_query, col_name)
     }
   }
-
-  # Remove duplicates
   text_cols_to_query <- unique(text_cols_to_query)
-
-  # Get categorical values
   if (length(text_cols_to_query) > 0) {
     for (col_name in text_cols_to_query) {
       tryCatch(
@@ -323,61 +348,131 @@ get_schema_impl <- function(
             DBI::dbQuoteIdentifier(conn, col_name)
           )
           result <- DBI::dbGetQuery(conn, prep_query(cat_query))
-          if (nrow(result) > 0) {
-            categorical_values[[col_name]] <- result[[1]]
-          }
+          if (nrow(result) > 0) categorical_values[[col_name]] <- result[[1]]
         },
-        error = function(e) {
-          # Skip categorical values if query fails
-        }
+        error = function(e) {}
       )
     }
   }
 
-  # Build schema description
-  for (col in columns) {
+  # Build structured column details (NA_character_ serialises to JSON null via jsonlite)
+  lapply(columns, function(col) {
+    spec <- documented[[col]]
     col_class <- class(sample_data[[col]])[1]
-    sql_type <- r_class_to_sql_type(col_class)
-
-    column_info <- paste0("- ", col, " (", sql_type, ")")
+    sql_type <- spec[["type"]] %||% r_class_to_sql_type(col_class)
+
+    min_val <- NA_character_
+    max_val <- NA_character_
+    categories <- list()
+    constraints <- if (length(spec[["constraints"]]) > 0) {
+      as.list(spec[["constraints"]])
+    } else {
+      list()
+    }
 
-    # Add range info for numeric columns
     if (col %in% numeric_columns) {
-      min_key <- paste0(col, "__min")
-      max_key <- paste0(col, "__max")
-      if (
-        min_key %in%
-          names(column_stats) &&
-          max_key %in% names(column_stats) &&
-          !is.na(column_stats[[min_key]]) &&
-          !is.na(column_stats[[max_key]])
-      ) {
-        range_info <- paste0(
-          "  Range: ",
-          column_stats[[min_key]],
-          " to ",
-          column_stats[[max_key]]
-        )
-        column_info <- paste(column_info, range_info, sep = "\n")
+      if (!is.null(spec[["range"]])) {
+        min_val <- as.character(spec[["range"]][["min"]] %||% "?")
+        max_val <- as.character(spec[["range"]][["max"]] %||% "?")
+      } else {
+        min_key <- paste0(col, "__min")
+        max_key <- paste0(col, "__max")
+        if (
+          min_key %in%
+            names(column_stats) &&
+            max_key %in% names(column_stats) &&
+            !is.na(column_stats[[min_key]]) &&
+            !is.na(column_stats[[max_key]])
+        ) {
+          min_val <- as.character(column_stats[[min_key]])
+          max_val <- as.character(column_stats[[max_key]])
+        }
       }
-    }
-
-    # Add categorical values for text columns
-    if (col %in% names(categorical_values)) {
-      values <- categorical_values[[col]]
-      if (length(values) > 0) {
-        values_str <- paste0("'", values, "'", collapse = ", ")
-        cat_info <- paste0("  Categorical values: ", values_str)
-        column_info <- paste(column_info, cat_info, sep = "\n")
+    } else if (col %in% text_columns) {
+      if (!is.null(spec[["values"]])) {
+        categories <- as.list(as.character(spec[["values"]]))
+      } else if (col %in% names(categorical_values)) {
+        vals <- categorical_values[[col]]
+        if (length(vals) > 0) categories <- as.list(as.character(vals))
       }
     }
 
-    schema_lines <- c(schema_lines, column_info)
-  }
+    list(
+      name = col,
+      sql_type = sql_type,
+      units = spec[["units"]] %||% NA_character_,
+      description = spec[["description"]] %||% NA_character_,
+      min_val = min_val,
+      max_val = max_val,
+      categories = categories,
+      constraints = constraints
+    )
+  })
+}
 
+# Format a list of column details (from build_column_details_impl) into LLM schema text.
+format_schema_from_details <- function(table_name_display, details) {
+  schema_lines <- c(paste("Table:", table_name_display), "Columns:")
+  for (col in details) {
+    line <- paste0("- ", col$name, " (", col$sql_type, ")")
+    if (!is.na(col$units)) {
+      line <- paste0(line, " [", col$units, "]")
+    }
+    if (!is.na(col$description)) {
+      line <- paste(
+        line,
+        paste0("  Description: ", col$description),
+        sep = "\n"
+      )
+    }
+    if (length(col$constraints) > 0) {
+      line <- paste(
+        line,
+        paste0("  Constraints: ", paste(col$constraints, collapse = ", ")),
+        sep = "\n"
+      )
+    }
+    if (!is.na(col$min_val) && !is.na(col$max_val)) {
+      line <- paste(
+        line,
+        paste0("  Range: ", col$min_val, " to ", col$max_val),
+        sep = "\n"
+      )
+    } else if (length(col$categories) > 0) {
+      values_str <- paste0("'", col$categories, "'", collapse = ", ")
+      line <- paste(
+        line,
+        paste0("  Categorical values: ", values_str),
+        sep = "\n"
+      )
+    }
+    schema_lines <- c(schema_lines, line)
+  }
   paste(schema_lines, collapse = "\n")
 }
 
+get_schema_impl <- function(
+  conn,
+  table_name,
+  categorical_threshold = 20,
+  columns = NULL,
+  prep_query = identity,
+  table_spec = NULL
+) {
+  check_function(prep_query)
+  details <- build_column_details_impl(
+    conn,
+    table_name,
+    categorical_threshold,
+    columns = columns,
+    prep_query = prep_query,
+    table_spec = table_spec
+  )
+  format_schema_from_details(
+    as.character(DBI::dbQuoteIdentifier(conn, table_name)),
+    details
+  )
+}
 
 # nocov start
 # Map R classes to SQL types
diff --git a/pkg-r/R/DataDict.R b/pkg-r/R/DataDict.R
new file mode 100644
index 000000000..04b59651c
--- /dev/null
+++ b/pkg-r/R/DataDict.R
@@ -0,0 +1,74 @@
+#' Read a Data Dictionary from YAML
+#'
+#' @description
+#' Loads a data dictionary from a YAML file conforming to the
+#' [data-dict spec](https://data-dict.tidyverse.org/). The dictionary is
+#' returned as a plain list and can be passed directly to [QueryChat] via the
+#' `data_dict` argument.
+#'
+#' If `name` is absent from the YAML file, it defaults to the file stem.
+#'
+#' @param path Path to the YAML file.
+#'
+#' @return A named list with the structure of the YAML file.
+read_data_dict <- function(path) {
+  check_installed("yaml")
+  check_string(path)
+
+  dd <- yaml::read_yaml(path) %||% list()
+
+  if (is.null(dd[["name"]])) {
+    dd[["name"]] <- tools::file_path_sans_ext(basename(path))
+  }
+
+  dd
+}
+
+#' Convert a data dict list to a filtered list for system prompt rendering.
+#'
+#' Keeps table descriptions (for LLM context), strips per-column details.
+#' Relationships keep only `join`, `description`, and `cardinality` (NULL fields dropped); the glossary is passed through as-is.
+#'
+#' @param dd A data dict list (from [read_data_dict()]).
+#' @return A named list suitable for inclusion in the system prompt template.
+#' @noRd
+data_dict_to_prompt_list <- function(dd) {
+  result <- list()
+
+  if (!is.null(dd[["name"]])) {
+    result[["name"]] <- dd[["name"]]
+  }
+  if (!is.null(dd[["description"]])) {
+    result[["description"]] <- dd[["description"]]
+  }
+  if (length(dd[["tables"]]) > 0) {
+    result[["tables"]] <- lapply(dd[["tables"]], function(ts) {
+      if (is.null(ts[["description"]])) {
+        NULL
+      } else {
+        list(description = ts[["description"]])
+      }
+    })
+  }
+  if (length(dd[["relationships"]]) > 0) {
+    result[["relationships"]] <- lapply(dd[["relationships"]], function(rs) {
+      compact(
+        list(
+          join = rs[["join"]],
+          description = rs[["description"]],
+          cardinality = rs[["cardinality"]]
+        )
+      )
+    })
+  }
+  if (length(dd[["glossary"]]) > 0) {
+    result[["glossary"]] <- dd[["glossary"]]
+  }
+
+  result
+}
+
+#' @noRd
+compact <- function(x) {
+  x[!vapply(x, is.null, logical(1))]
+}
diff --git a/pkg-r/R/DataFrameSource.R b/pkg-r/R/DataFrameSource.R
index f03455ebe..edded59f8 100644
--- a/pkg-r/R/DataFrameSource.R
+++ b/pkg-r/R/DataFrameSource.R
@@ -70,6 +70,21 @@ DataFrameSource <- R6::R6Class(
       private$colnames <- colnames(df)
 
       private$conn <- new_dataframe_connection(df, table_name, engine)
+    },
+
+    #' @description
+    #' Disconnect from the database and shut down the DuckDB instance if used.
+    #'
+    #' @return NULL (invisibly)
+    cleanup = function() {
+      if (!is.null(private$conn) && DBI::dbIsValid(private$conn)) {
+        if (inherits(private$conn, "duckdb_connection")) {
+          DBI::dbDisconnect(private$conn, shutdown = TRUE)
+        } else {
+          DBI::dbDisconnect(private$conn)
+        }
+      }
+      invisible(NULL)
     }
   )
 )
@@ -98,10 +113,12 @@ get_default_dataframe_engine <- function() {
   if (is_installed("RSQLite")) {
     return("sqlite")
   }
-  cli::cli_abort(c(
-    "No compatible database engine installed for DataFrameSource",
-    "i" = "Install either {.pkg duckdb} or {.pkg RSQLite}:",
-    " " = "{.run install.packages(\"duckdb\")}",
-    " " = "{.run install.packages(\"RSQLite\")}"
-  ))
+  cli::cli_abort(
+    c(
+      "No compatible database engine installed for DataFrameSource",
+      "i" = "Install either {.pkg duckdb} or {.pkg RSQLite}:",
+      " " = "{.run install.packages(\"duckdb\")}",
+      " " = "{.run install.packages(\"RSQLite\")}"
+    )
+  )
 }
diff --git a/pkg-r/R/DataSource.R b/pkg-r/R/DataSource.R
index 4fc3e74b6..fe4c1539d 100644
--- a/pkg-r/R/DataSource.R
+++ b/pkg-r/R/DataSource.R
@@ -45,13 +45,23 @@ DataSource <- R6::R6Class(
     #' @param categorical_threshold Maximum number of unique values for a text
     #'   column to be considered categorical
     #' @return A string containing schema information formatted for LLM prompts
-    get_schema = function(categorical_threshold = 20) {
+    get_schema = function(categorical_threshold = 20, table_spec = NULL) {
       cli::cli_abort(
         "{.fn get_schema} must be implemented by subclass",
         class = "not_implemented_error"
       )
     },
 
+    get_schema_result = function(
+      categorical_threshold = 20,
+      table_spec = NULL
+    ) {
+      cli::cli_abort(
+        "{.fn get_schema_result} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+
     #' @description
     #' Execute a SQL query and return results
     #'
diff --git a/pkg-r/R/PinSource.R b/pkg-r/R/PinSource.R
index da678f81b..84bbde013 100644
--- a/pkg-r/R/PinSource.R
+++ b/pkg-r/R/PinSource.R
@@ -134,10 +134,12 @@ PinSource <- R6::R6Class(
         duckdb_lock_down(con)
       } else {
         if (engine == "sqlite" && pin_type %in% duckdb_file_types) {
-          cli::cli_warn(c(
-            "Reading {pin_type} pin {.val {name}} into SQLite.",
-            "i" = "The {.pkg duckdb} engine reads {pin_type} pins more efficiently. Install {.pkg duckdb} or pass {.code engine = \"duckdb\"} to read the pin files directly."
-          ))
+          cli::cli_warn(
+            c(
+              "Reading {pin_type} pin {.val {name}} into SQLite.",
+              "i" = "The {.pkg duckdb} engine reads {pin_type} pins more efficiently. Install {.pkg duckdb} or pass {.code engine = \"duckdb\"} to read the pin files directly."
+            )
+          )
         }
         data <- pins::pin_read(board, name, version = version)
         if (!is.data.frame(data)) {
diff --git a/pkg-r/R/QueryChat.R b/pkg-r/R/QueryChat.R
index 75496c746..576d9abce 100644
--- a/pkg-r/R/QueryChat.R
+++ b/pkg-r/R/QueryChat.R
@@ -15,7 +15,7 @@
 #' - Initialize server logic that returns session-specific reactive values (via
 #'   `$server()`)
 #' - Access reactive data, SQL queries, and titles through the returned server
-#'   values
+#'   values (use `qc_vals$table("name")` for multi-table access)
 #'
 #' @section Usage in Shiny Apps:
 #' ```r
@@ -89,9 +89,10 @@
 QueryChat <- R6::R6Class(
   "QueryChat",
   private = list(
-    server_values = NULL,
-    .data_source = NULL,
-    .table_name = NULL,
+    .data_sources = list(),
+    .deferred_table_name = NULL,
+    .query_executor = NULL,
+    .server_initialized = FALSE,
     .client_spec = NULL,
     .client_console = NULL,
     .system_prompt = NULL,
@@ -101,24 +102,27 @@ QueryChat <- R6::R6Class(
     .data_description_mode = "empty", # "supplied", "inferred", or "empty"
     .extra_instructions = NULL,
     .categorical_threshold = NULL,
+    .data_dicts = list(),
 
-    require_data_source = function(method_name) {
-      if (is.null(private$.data_source)) {
+    require_initialized = function(method_name) {
+      if (length(private$.data_sources) == 0) {
         cli::cli_abort(
           "{.arg data_source} must be set before calling {.fn ${method_name}}.
-           Either pass {.arg data_source} to {.fn $new}, set the
-           {.field $data_source} property, or pass {.arg data_source} to {.fn $server}."
+           Either pass {.arg data_source} to {.fn $new}, or call {.fn $add_table}."
         )
       }
     },
 
-    auto_fill_data_description = function() {
+    auto_fill_data_description = function(sources = private$.data_sources) {
+      if (length(sources) != 1) {
+        return()
+      }
       if (private$.data_description_mode == "inferred") {
         private$.data_description <- NULL
         private$.data_description_mode <- "empty"
       }
       if (private$.data_description_mode == "empty") {
-        desc <- private$.data_source$get_data_description()
+        desc <- sources[[1]]$get_data_description()
         if (nzchar(desc %||% "")) {
           private$.data_description <- desc
           private$.data_description_mode <- "inferred"
@@ -126,26 +130,22 @@ QueryChat <- R6::R6Class(
       }
     },
 
-    build_system_prompt = function() {
-      if (is.null(private$.data_source)) {
-        cli::cli_abort("Cannot build system prompt without data_source")
+    build_system_prompt = function(data_sources = NULL) {
+      sources <- data_sources %||% private$.data_sources
+      if (length(sources) == 0) {
+        cli::cli_abort("Cannot build system prompt without data sources")
       }
 
-      prompt_template <- private$.prompt_template
-      if (is.null(prompt_template)) {
-        prompt_template <- system.file(
-          "prompts",
-          "prompt.md",
-          package = "querychat"
-        )
-      }
+      prompt_template <- private$.prompt_template %||%
+        system.file("prompts", "prompt.md", package = "querychat")
 
       private$.system_prompt <- QueryChatSystemPrompt$new(
         prompt_template = prompt_template,
-        data_source = private$.data_source,
+        data_sources = sources,
         data_description = private$.data_description,
         extra_instructions = private$.extra_instructions,
-        categorical_threshold = private$.categorical_threshold
+        categorical_threshold = private$.categorical_threshold,
+        data_dicts = private$.data_dicts
       )
     },
 
@@ -153,8 +153,8 @@ QueryChat <- R6::R6Class(
       client_spec = NULL,
       tools = NA,
       session = NULL,
-      update_dashboard = function(query, title) {},
-      reset_dashboard = function() {},
+      update_dashboard = function(query, title, table) {},
+      reset_dashboard = function(table) {},
       visualize = function(data) {}
     ) {
       spec <- client_spec %||% private$.client_spec
@@ -172,18 +172,40 @@ QueryChat <- R6::R6Class(
         return(chat)
       }
 
+      # Build executor lazily
+      if (is.null(private$.query_executor)) {
+        private$.query_executor <- build_query_executor(private$.data_sources)
+      }
+      executor <- private$.query_executor
+      tbl_names <- names(private$.data_sources)
+
+      # Always register get_schema tool
+      chat$register_tool(
+        tool_get_schema(
+          private$.data_dicts,
+          executor,
+          tbl_names,
+          private$.categorical_threshold
+        )
+      )
+
       if ("update" %in% tools) {
         chat$register_tool(
           tool_update_dashboard(
-            private$.data_source,
+            executor,
+            tbl_names,
             update_fn = update_dashboard
           )
         )
-        chat$register_tool(tool_reset_dashboard(reset_dashboard))
+        chat$register_tool(
+          tool_reset_dashboard(reset_dashboard, table_names = tbl_names)
+        )
       }
 
       if ("query" %in% tools) {
-        chat$register_tool(tool_query(private$.data_source))
+        chat$register_tool(
+          tool_query(executor, multi_table = length(tbl_names) > 1)
+        )
       }
 
       if ("visualize" %in% tools) {
@@ -193,7 +215,7 @@ QueryChat <- R6::R6Class(
         )
         chat$register_tool(
           tool_visualize_dashboard(
-            private$.data_source,
+            executor,
             session = session,
             update_fn = visualize,
             has_tool_query = "query" %in% tools
@@ -209,6 +231,8 @@ QueryChat <- R6::R6Class(
     greeting = NULL,
     #' @field id ID for the QueryChat instance.
     id = NULL,
+    #' @field id_override The ID explicitly supplied by the user, or `NULL` when the ID is derived from the table name.
+    id_override = NULL,
     #' @field tools The allowed tools for the chat client.
     tools = c("filter", "query"),
 
@@ -217,8 +241,8 @@ QueryChat <- R6::R6Class(
     #'
     #' @param data_source Either a data.frame, a database connection (e.g., DBI
     #'   connection), or `NULL` to defer setting the data source until later.
-    #'   When `NULL`, the data source must be set via the `$data_source` property
-    #'   or passed to `$server()` before calling methods that require data access.
+    #'   When `NULL`, the data source must be added via `$add_table()` before
+    #'   calling `$server()` or any other method that requires data access.
     #' @param table_name A string specifying the table name to use in SQL
     #'   queries. If `data_source` is a data.frame, this is the name to refer to
     #'   it by in queries (typically the variable name). If not provided, will
@@ -257,6 +281,8 @@ QueryChat <- R6::R6Class(
     #'   template file. If not provided, the default querychat template will be
     #'   used. See the package prompts directory for the default template
     #'   format.
+    #' @param data_dict Optional data dictionary. A path to a YAML file, or a
+    #'   list of YAML file paths. See [read_data_dict()] for the expected format.
     #' @param cleanup Whether or not to automatically run `$cleanup()` when the
     #'   Shiny session/app stops. By default, cleanup only occurs if `QueryChat`
     #'   gets created within a Shiny session. Set to `TRUE` to always clean up,
@@ -275,6 +301,7 @@ QueryChat <- R6::R6Class(
       categorical_threshold = 20,
       extra_instructions = NULL,
       prompt_template = NULL,
+      data_dict = NULL,
       cleanup = NA
     ) {
       check_dots_empty()
@@ -294,28 +321,8 @@ QueryChat <- R6::R6Class(
       check_string(prompt_template, allow_null = TRUE)
       check_bool(cleanup, allow_na = TRUE)
 
-      # Handle table_name inference for non-NULL data sources
-      if (is_missing(table_name)) {
-        if (is.null(data_source)) {
-          cli::cli_abort(
-            "{.arg table_name} is required when {.arg data_source} is {.val NULL}."
-          )
-        }
-        if (inherits(data_source, "DataSource")) {
-          table_name <- data_source$table_name
-        } else if (
-          is.data.frame(data_source) || inherits(data_source, "tbl_sql")
-        ) {
-          table_name <- deparse1(substitute(data_source))
-        } else if (inherits(data_source, "pins_board")) {
-          cli::cli_abort(
-            "{.arg table_name} (the pin name) is required when {.arg data_source} is a pins board."
-          )
-        }
-      }
-
-      # Store table_name for later normalization (needed for deferred pattern)
-      private$.table_name <- table_name
+      # Normalize data_dicts
+      private$.data_dicts <- normalize_data_dicts(data_dict)
 
       # Store init parameters for deferred system prompt building
       private$.prompt_template <- prompt_template
@@ -328,25 +335,48 @@ QueryChat <- R6::R6Class(
       private$.extra_instructions <- extra_instructions
       private$.categorical_threshold <- categorical_threshold
 
-      self$id <- id %||% sprintf("querychat_%s", table_name)
       self$tools <- tools
+      private$.client_spec <- client
 
       if (!is.null(greeting) && file.exists(greeting)) {
         greeting <- read_utf8(greeting)
       }
       self$greeting <- greeting
 
-      # Initialize data source (may be NULL for deferred pattern)
+      # Remember the user-supplied id (NULL when the id is derived from the table name)
+      self$id_override <- id
+
+      # Handle table_name inference for non-NULL data sources
       if (!is.null(data_source)) {
-        private$.data_source <- normalize_data_source(data_source, table_name)
-        private$.table_name <- private$.data_source$table_name
-        self$id <- id %||% sprintf("querychat_%s", private$.table_name)
+        if (is_missing(table_name)) {
+          if (inherits(data_source, "DataSource")) {
+            table_name <- data_source$table_name
+          } else if (
+            is.data.frame(data_source) || inherits(data_source, "tbl_sql")
+          ) {
+            table_name <- deparse1(substitute(data_source))
+          } else if (inherits(data_source, "pins_board")) {
+            cli::cli_abort(
+              "{.arg table_name} (the pin name) is required when {.arg data_source} is a pins board."
+            )
+          }
+        }
+        normalized <- normalize_data_source(data_source, table_name)
+        private$.data_sources[[normalized$table_name]] <- normalized
         private$auto_fill_data_description()
         private$build_system_prompt()
+        self$id <- id %||% sprintf("querychat_%s", normalized$table_name)
+      } else {
+        # Deferred pattern: data_source is NULL
+        if (is_missing(table_name)) {
+          cli::cli_abort(
+            "{.arg table_name} is required when {.arg data_source} is {.val NULL}."
+          )
+        }
+        private$.deferred_table_name <- table_name
+        self$id <- id %||% sprintf("querychat_%s", table_name)
       }
 
-      private$.client_spec <- client
-
       # By default, only close automatically if a Shiny session is active
       if (is.na(cleanup)) {
         cleanup <- shiny::isRunning()
@@ -360,6 +390,187 @@ QueryChat <- R6::R6Class(
       }
     },
 
+    #' @description
+    #' Add a table to this QueryChat instance. Aborts if called after server
+    #' initialization, or if `table_name` already exists and `replace` is `FALSE`.
+    #'
+    #' @param data_source A data frame, database connection, or DataSource object.
+    #' @param table_name The SQL table name for this data source.
+    #' @param replace Whether to replace an existing table with this name.
+    #'   Default is `FALSE`.
+    #' @return Invisibly returns `self` for chaining.
+    add_table = function(data_source, table_name, replace = FALSE) {
+      if (private$.server_initialized) {
+        cli::cli_abort("Cannot add tables after server initialization.")
+      }
+      check_sql_table_name(table_name)
+      if (table_name %in% names(private$.data_sources) && !replace) {
+        cli::cli_abort(
+          "Table {.val {table_name}} already exists. Use {.code replace = TRUE} to replace."
+        )
+      }
+      normalized <- normalize_data_source(data_source, table_name)
+      # Only the *other* tables are checked; a same-named one is being replaced.
+      other_sources <- private$.data_sources[
+        names(private$.data_sources) != table_name
+      ]
+      check_source_compatibility(other_sources, normalized, table_name)
+      # Stage the change in a copy so private$.data_sources is untouched for now.
+      next_sources <- private$.data_sources
+      next_sources[[table_name]] <- normalized
+      # Prompt-build failure cleans up `normalized` unless a DataSource was passed.
+      private$auto_fill_data_description(next_sources)
+      tryCatch(
+        {
+          private$build_system_prompt(data_sources = next_sources)
+        },
+        error = function(e) {
+          if (!inherits(data_source, "DataSource")) {
+            normalized$cleanup()
+          }
+          stop(e)
+        }
+      )
+      # Commit, then clean up the replaced source unless identical to the new one.
+      old_source <- private$.data_sources[[table_name]]
+      private$.data_sources <- next_sources
+      if (!is.null(old_source) && !identical(old_source, normalized)) {
+        old_source$cleanup()
+      }
+      # Discard any existing query executor, ignoring errors from its cleanup.
+      if (!is.null(private$.query_executor)) {
+        tryCatch(private$.query_executor$cleanup(), error = function(e) NULL)
+        private$.query_executor <- NULL
+      }
+      # With exactly one table and no `id_override`, derive the id from its name.
+      if (length(private$.data_sources) == 1 && is.null(self$id_override)) {
+        self$id <- sprintf("querychat_%s", table_name)
+      }
+
+      invisible(self)
+    },
+
+    #' @description
+    #' Add multiple tables from a DBI connection in a single call.
+    #'
+    #' Unlike calling `$add_table()` repeatedly, this method builds the
+    #' system prompt exactly once after all tables have been staged, avoiding
+    #' N-1 spurious intermediate rebuilds.
+    #'
+    #' @param conn A DBI connection. Only DBI connections are supported; pass
+    #'   individual data frames or other sources via `$add_table()`.
+    #' @param tables Table names to register. When `NULL`, all tables returned
+    #'   by `DBI::dbListTables(conn)` are used.
+    #' @param replace Whether to replace existing tables with the same name.
+    #'   Default is `FALSE`.
+    #'
+    #' @return Invisibly returns `self` for chaining.
+    add_tables = function(conn, tables = NULL, replace = FALSE) {
+      if (private$.server_initialized) {
+        cli::cli_abort("Cannot add tables after server initialization.")
+      }
+      if (!inherits(conn, "DBIConnection")) {
+        cli::cli_abort(c(
+          "{.fn add_tables} requires a {.cls DBIConnection}, not {.obj_type_friendly {conn}}.",
+          "i" = "Use {.fn add_table} for data frames and other source types."
+        ))
+      }
+      if (is.null(tables)) {
+        tables <- DBI::dbListTables(conn)
+      }
+      if (length(tables) == 0) {
+        cli::cli_abort("No tables found in database.")
+      }
+      for (table_name in tables) {
+        check_sql_table_name(table_name)
+        if (table_name %in% names(private$.data_sources) && !replace) {
+          cli::cli_abort(
+            "Table {.val {table_name}} already exists. Use {.code replace = TRUE} to replace."
+          )
+        }
+      }
+      # Normalize every requested table up front, keyed by table name.
+      normalized <- stats::setNames(
+        lapply(tables, function(tbl) normalize_data_source(conn, tbl)),
+        tables
+      )
+      # Check each table against existing sources plus those already staged.
+      staged <- list()
+      for (table_name in tables) {
+        other_sources <- private$.data_sources[
+          names(private$.data_sources) != table_name
+        ]
+        check_source_compatibility(
+          c(other_sources, staged),
+          normalized[[table_name]],
+          table_name
+        )
+        staged[[table_name]] <- normalized[[table_name]]
+      }
+      # Build the candidate source list without touching private state yet.
+      next_sources <- private$.data_sources
+      for (table_name in tables) {
+        next_sources[[table_name]] <- normalized[[table_name]]
+      }
+
+      private$auto_fill_data_description(next_sources)
+      private$build_system_prompt(data_sources = next_sources)
+      # Clean up replaced sources (unless identical), then commit the new list.
+      for (table_name in tables) {
+        old_source <- private$.data_sources[[table_name]]
+        if (
+          !is.null(old_source) &&
+            !identical(old_source, normalized[[table_name]])
+        ) {
+          old_source$cleanup()
+        }
+      }
+      private$.data_sources <- next_sources
+      # Discard any existing query executor, ignoring errors from its cleanup.
+      if (!is.null(private$.query_executor)) {
+        tryCatch(private$.query_executor$cleanup(), error = function(e) NULL)
+        private$.query_executor <- NULL
+      }
+
+      invisible(self)
+    },
+
+    #' @description
+    #' Remove a table from this QueryChat instance. Aborts after server
+    #' initialization, for an unknown name, or when it is the only table.
+    #' @param table_name The name of the table to remove.
+    #'
+    #' @return Invisibly returns `self` for chaining.
+    remove_table = function(table_name) {
+      if (private$.server_initialized) {
+        cli::cli_abort("Cannot remove tables after server initialization.")
+      }
+      if (!table_name %in% names(private$.data_sources)) {
+        cli::cli_abort("Table {.val {table_name}} not found.")
+      }
+      if (length(private$.data_sources) == 1) {
+        cli::cli_abort(
+          "Cannot remove last table. At least one table is required."
+        )
+      }
+      removed <- private$.data_sources[[table_name]]
+      next_sources <- private$.data_sources[
+        names(private$.data_sources) != table_name
+      ]
+      private$build_system_prompt(data_sources = next_sources)
+      private$.data_sources <- next_sources
+      if (!is.null(private$.query_executor)) {
+        tryCatch(private$.query_executor$cleanup(), error = function(e) NULL)
+        private$.query_executor <- NULL
+      }
+      removed$cleanup()
+      invisible(self)
+    },
+
+    #' @description Return the names of all registered tables.
+    #' @return The names of the registered data sources, via `names()`.
+    table_names = function() names(private$.data_sources),
+
     #' @description
     #' Create a chat client, complete with registered tools, for the current
     #' data source.
@@ -369,10 +580,10 @@ QueryChat <- R6::R6Class(
     #'   and `"query"` includes the tool for executing SQL queries. By default,
     #'   when `tools = NA`, the values provided at initialization are used.
     #'   The legacy name `"update"` is still accepted as an alias for `"filter"`.
-    #' @param update_dashboard Optional function to call with the `query` and
-    #'   `title` generated by the LLM for the `update_dashboard` tool.
+    #' @param update_dashboard Optional function to call with the `query`,
+    #'   `title`, and `table` generated by the LLM for the `update_dashboard` tool.
     #' @param reset_dashboard Optional function to call when the
-    #'   `reset_dashboard` tool is called.
+    #'   `reset_dashboard` tool is called. Takes a `table` argument.
     #' @param visualize Optional function to call with a list containing
     #'   `ggsql`, `title`, and `widget_id` when a visualization succeeds.
     #' @param session A Shiny session object. Required when `"visualize"` is
@@ -381,12 +592,12 @@ QueryChat <- R6::R6Class(
     #'   as Shiny outputs.
     client = function(
       tools = NA,
-      update_dashboard = function(query, title) {},
-      reset_dashboard = function() {},
+      update_dashboard = function(query, title, table) {},
+      reset_dashboard = function(table) {},
       visualize = function(data) {},
       session = NULL
     ) {
-      private$require_data_source("$client")
+      private$require_initialized("$client")
 
       if (!is_na(tools) && !is.null(tools)) {
         tools <- arg_match(
@@ -417,7 +628,7 @@ QueryChat <- R6::R6Class(
     #'   By default, only the `"query"` tool is included, regardless of the
     #'   `tools` set at initialization.
     console = function(new = FALSE, ..., tools = "query") {
-      private$require_data_source("$console")
+      private$require_initialized("$console")
       check_bool(new)
       if (new || is.null(private$.client_console)) {
         private$.client_console <- self$client(tools = tools, ...)
@@ -429,28 +640,12 @@ QueryChat <- R6::R6Class(
     #' @description
     #' Create and run a Shiny gadget for chatting with data
     #'
-    #' Runs a Shiny gadget (designed for interactive use) that provides a
-    #' complete interface for chatting with your data using natural language. If
-    #' you're looking to deploy this app or run it through some other means, see
-    #' `$app_obj()`.
-    #'
-    #' ```r
-    #' library(querychat)
-    #'
-    #' qc <- QueryChat$new(mtcars)
-    #' qc$app()
-    #' ```
-    #'
     #' @param ... Arguments passed to `$app_obj()`.
     #' @param bookmark_store The bookmarking storage method. Passed to
     #'   [shiny::enableBookmarking()]. If `"url"` or `"server"`, the chat state
     #'   (including current query) will be bookmarked. Default is `"url"`.
     #'
-    #' @return Invisibly returns a list of session-specific values:
-    #'  - `df`: The final filtered data frame
-    #'  - `sql`: The final SQL query string
-    #'  - `title`: The final title
-    #'  - `client`: The session-specific chat client instance
+    #' @return Invisibly returns a list of session-specific values.
     app = function(..., bookmark_store = "url") {
       app <- self$app_obj(..., bookmark_store = bookmark_store)
       vals <- tryCatch(shiny::runGadget(app), interrupt = function(cnd) NULL)
@@ -460,39 +655,24 @@ QueryChat <- R6::R6Class(
     #' @description
     #' A streamlined Shiny app for chatting with data
     #'
-    #' Creates a Shiny app designed for chatting with data, with:
-    #' - A sidebar containing the chat interface
-    #' - A card displaying the current SQL query
-    #' - A card displaying the filtered data table
-    #' - A reset button to clear the query
-    #'
-    #' ```r
-    #' library(querychat)
-    #'
-    #' qc <- QueryChat$new(mtcars)
-    #' app <- qc$app_obj()
-    #' shiny::runApp(app)
-    #' ```
-    #'
     #' @param ... Additional arguments (currently unused).
     #' @param bookmark_store The bookmarking storage method. Passed to
-    #'  [shiny::enableBookmarking()]. If `"url"` or `"server"`, the chat state
-    #'  (including current query) will be bookmarked. Default is `"url"`.
+    #'  [shiny::enableBookmarking()]. Default is `"url"`.
     #'
     #' @return A Shiny app object that can be run with `shiny::runApp()`.
     app_obj = function(..., bookmark_store = "url") {
-      private$require_data_source("$app_obj")
+      private$require_initialized("$app_obj")
       check_installed("DT")
       check_dots_empty()
 
-      table_name <- private$.data_source$table_name
+      first_table_name <- names(private$.data_sources)[[1]]
 
       ui <- function(req) {
         bslib::page_sidebar(
           title = shiny::HTML(
             sprintf(
               "<span>querychat with <code>%s</code></span>",
-              table_name
+              first_table_name
             )
           ),
           class = "bslib-page-dashboard",
@@ -518,7 +698,11 @@ QueryChat <- R6::R6Class(
           ),
           bslib::card(
             full_screen = TRUE,
-            bslib::card_header(bsicons::bs_icon("table"), "Data"),
+            bslib::card_header(
+              bsicons::bs_icon("table"),
+              "Data \u2014 ",
+              shiny::textOutput("data_card_header_text", inline = TRUE)
+            ),
             DT::DTOutput("dt")
           ),
           shiny::actionButton(
@@ -532,21 +716,25 @@ QueryChat <- R6::R6Class(
 
       server <- function(input, output, session) {
         shiny::setBookmarkExclude(c("close_btn", "reset_query"))
-        # Enable bookmarking if bookmark_store is enabled
         enable_bookmarking <- bookmark_store %in% c("url", "server")
         qc_vals <- self$server(enable_bookmarking = enable_bookmarking)
 
+        active_table_name <- shiny::reactive({
+          ct <- qc_vals$current_table()
+          if (!is.null(ct)) ct else first_table_name
+        })
+
+        output$data_card_header_text <- shiny::renderText({
+          active_table_name()
+        })
+
         output$query_title <- shiny::renderText({
-          if (shiny::isTruthy(qc_vals$title())) {
-            qc_vals$title()
-          } else {
-            "SQL Query"
-          }
+          title <- qc_vals$.tables[[active_table_name()]]$title()
+          if (shiny::isTruthy(title)) title else "SQL Query"
         })
 
         output$ui_reset <- shiny::renderUI({
-          shiny::req(qc_vals$sql())
-
+          shiny::req(qc_vals$.tables[[active_table_name()]]$sql())
           shiny::actionButton(
             "reset_query",
             label = "Reset Query",
@@ -555,17 +743,16 @@ QueryChat <- R6::R6Class(
         })
 
         shiny::observeEvent(input$reset_query, label = "on_reset_query", {
-          qc_vals$sql(NULL)
-          qc_vals$title(NULL)
+          name <- active_table_name()
+          qc_vals$.tables[[name]]$sql(NULL)
+          qc_vals$.tables[[name]]$title(NULL)
         })
 
         output$dt <- DT::renderDT({
-          df <- qc_vals$df()
+          df <- qc_vals$.tables[[active_table_name()]]$df()
           if (inherits(df, "tbl_sql")) {
-            # Materialize the query for DT, {dplyr} guaranteed by TblSqlSource
             df <- dplyr::collect(df)
           }
-
           DT::datatable(
             df,
             fillContainer = TRUE,
@@ -574,14 +761,14 @@ QueryChat <- R6::R6Class(
         })
 
         output$sql_output <- shiny::renderUI({
-          sql <- if (shiny::isTruthy(qc_vals$sql())) {
-            qc_vals$sql()
+          name <- active_table_name()
+          sql <- qc_vals$.tables[[name]]$sql()
+          sql_text <- if (shiny::isTruthy(sql)) {
+            sql
           } else {
-            paste("SELECT * FROM", table_name)
+            paste("SELECT * FROM", name)
           }
-
-          sql_code <- paste(c("```sql", sql, "```"), collapse = "\n")
-
+          sql_code <- paste(c("```sql", sql_text, "```"), collapse = "\n")
           shinychat::output_markdown_stream(
             "sql_code",
             content = sql_code,
@@ -591,11 +778,12 @@ QueryChat <- R6::R6Class(
         })
 
         shiny::observeEvent(input$close_btn, label = "on_close_btn", {
+          name <- active_table_name()
           shiny::stopApp(
             list(
-              df = qc_vals$df(),
-              sql = qc_vals$sql(),
-              title = qc_vals$title(),
+              df = qc_vals$.tables[[name]]$df(),
+              sql = qc_vals$.tables[[name]]$sql(),
+              title = qc_vals$.tables[[name]]$title(),
               client = qc_vals$client
             )
           )
@@ -608,28 +796,12 @@ QueryChat <- R6::R6Class(
     #' @description
     #' Create a sidebar containing the querychat UI.
     #'
-    #' This method generates a [bslib::sidebar()] component containing the chat
-    #' interface, suitable for use with [bslib::page_sidebar()] or similar
-    #' layouts.
-    #'
-    #' ```r
-    #' qc <- QueryChat$new(mtcars)
-    #'
-    #' ui <- page_sidebar(
-    #'   qc$sidebar(),
-    #'   # Main content here
-    #' )
-    #' ```
-    #'
     #' @param ... Additional arguments passed to [bslib::sidebar()].
     #' @param width Width of the sidebar in pixels. Default is 400.
     #' @param height Height of the sidebar. Default is "100%".
     #' @param fillable Whether the sidebar should be fillable. Default is
     #'   `TRUE`.
-    #' @param id Optional ID for the QueryChat instance. If not provided, will
-    #'   use the ID provided at initialization. If using `$sidebar()` in a Shiny
-    #'   module, you'll need to provide `id = ns("your_id")` where `ns` is the
-    #'   namespacing function from [shiny::NS()].
+    #' @param id Optional ID for the QueryChat instance.
     #'
     #' @return A [bslib::sidebar()] UI component.
     sidebar = function(
@@ -652,33 +824,13 @@ QueryChat <- R6::R6Class(
     #' @description
     #' Create the UI for the querychat chat interface.
     #'
-    #' This method generates the chat UI component. Typically you'll use
-    #' `$sidebar()` instead, which wraps this in a sidebar layout.
-    #'
-    #' ```r
-    #' qc <- QueryChat$new(mtcars)
-    #'
-    #' ui <- fluidPage(
-    #'   qc$ui()
-    #' )
-    #' ```
-    #'
     #' @param ... Additional arguments passed to [shinychat::chat_ui()].
-    #' @param id Optional ID for the QueryChat instance. If not provided,
-    #'   will use the ID provided at initialization. If using `$ui()` in a Shiny
-    #'   module, you'll need to provide `id = ns("your_id")` where `ns` is the
-    #'   namespacing function from [shiny::NS()].
+    #' @param id Optional ID for the QueryChat instance.
     #'
     #' @return A UI component containing the chat interface.
     ui = function(..., id = NULL) {
       check_string(id, allow_null = TRUE, allow_empty = FALSE)
 
-      # If called within another module, the UI id needs to be namespaced
-      # by that "parent" module. If called in a module *server* context, we
-      # can infer the namespace from the session, but if not, the user
-      # will need to provide it.
-      # NOTE: this isn't a problem for Python since id namespacing is handled
-      # implicitly by UI functions like shinychat.chat_ui().
       id <- id %||% namespaced_id(self$id)
 
       mod_ui(id, ..., greeting = self$greeting)
@@ -687,53 +839,20 @@ QueryChat <- R6::R6Class(
     #' @description
     #' Initialize the querychat server logic.
     #'
-    #' This method must be called within a Shiny server function. It sets up the
-    #' reactive logic for the chat interface and returns session-specific
-    #' reactive values.
-    #'
-    #' ```r
-    #' qc <- QueryChat$new(mtcars)
-    #'
-    #' server <- function(input, output, session) {
-    #'   qc_vals <- qc$server(enable_bookmarking = TRUE)
-    #'
-    #'   output$data <- renderDataTable(qc_vals$df())
-    #'   output$query <- renderText(qc_vals$sql())
-    #'   output$title <- renderText(qc_vals$title() %||% "No Query")
-    #' }
-    #' ```
-    #'
-    #' @param data_source Optional data source to use. If provided, sets the
-    #'   data_source property before initializing server logic. This is useful
-    #'   for the deferred pattern where data_source is not known at
-    #'   initialization time (e.g., when the data source depends on session-
-    #'   specific authentication).
-    #' @param client Optional chat client override for this session. Can be an
-    #'   [ellmer::Chat] object or a string (e.g., `"openai/gpt-4o"`). If provided,
-    #'   overrides the client set at initialization for this session only —
-    #'   other sessions are unaffected. This is useful when the client must be
-    #'   created within a session scope (e.g., Posit Connect managed credentials).
-    #' @param enable_bookmarking Whether to enable bookmarking for the chat
-    #'   state. Default is `FALSE`. When enabled, the chat state (including
-    #'   current query, title, and chat history) will be saved and restored
-    #'   with Shiny bookmarks. This requires that the Shiny app has bookmarking
-    #'   enabled via `shiny::enableBookmarking()` or the `enableBookmarking`
-    #'   parameter of `shiny::shinyApp()`.
+    #' @param data_source Optional data source for backward compatibility.
+    #'   If provided, calls `$add_table()` before initializing server logic.
+    #' @param client Optional chat client override for this session.
+    #' @param enable_bookmarking Whether to enable bookmarking. Default is `FALSE`.
     #' @param ... Ignored.
-    #' @param id Optional module ID for the QueryChat instance. If not provided,
-    #'   will use the ID provided at initialization. When used in Shiny modules,
-    #'   this `id` should match the `id` used in the corresponding UI function
-    #'   (i.e., `qc$ui(id = ns("your_id"))` pairs with `qc$server(id =
-    #'   "your_id")`).
+    #' @param id Optional module ID override.
     #' @param session The Shiny session object.
     #'
     #' @return A list containing session-specific reactive values and the chat
-    #'   client with the following elements:
-    #'   - `df`: Reactive expression returning the current filtered data frame
-    #'   - `sql`: Reactive value for the current SQL query string
-    #'   - `title`: Reactive value for the current title
-    #'   - `client`: The session-specific chat client instance
-    #'
+    #'   client. For single-table usage, includes `df`, `sql`, `title` directly.
+    #'   For multi-table, use `qc_vals$table("name")` to get a [TableAccessor]
+    #'   with per-table reactive state. Also includes `table_names()` to list tables.
+    #'   `current_table()` returns the name of the most recently queried table,
+    #'   or `NULL` before any query.
     server = function(
       data_source = NULL,
       client = NULL,
@@ -752,10 +871,18 @@ QueryChat <- R6::R6Class(
       }
 
       if (!is.null(data_source)) {
-        self$data_source <- data_source
+        tbl_name <- private$.deferred_table_name %||%
+          names(private$.data_sources)[[1]]
+        self$add_table(data_source, tbl_name, replace = TRUE)
       }
 
-      private$require_data_source("$server")
+      private$require_initialized("$server")
+
+      private$.server_initialized <- TRUE
+
+      if (is.null(private$.query_executor)) {
+        private$.query_executor <- build_query_executor(private$.data_sources)
+      }
 
       resolved_client_spec <- client %||% private$.client_spec
 
@@ -766,42 +893,26 @@ QueryChat <- R6::R6Class(
         )
       }
 
-      mod_server(
+      result <- mod_server(
         id %||% self$id,
-        data_source = private$.data_source,
+        data_sources = private$.data_sources,
+        executor = private$.query_executor,
         greeting = self$greeting,
         client = create_session_client,
         tools = self$tools,
         enable_bookmarking = enable_bookmarking
       )
+      result
     },
 
     #' @description
     #' Generate a welcome greeting for the chat.
     #'
-    #' By default, `QueryChat$new()` generates a greeting at the start of every
-    #' new conversation, which is convenient for getting started and
-    #' development, but also might add unnecessary latency and cost. Use this
-    #' method to generate a greeting once and save it for reuse.
-    #'
-    #' ```r
-    #' # Create QueryChat object
-    #' qc <- QueryChat$new(mtcars)
-    #'
-    #' # Generate a greeting and save it
-    #' greeting <- qc$generate_greeting()
-    #' writeLines(greeting, "mtcars_greeting.md")
-    #'
-    #' # Later, use the saved greeting
-    #' qc2 <- QueryChat$new(mtcars, greeting = "mtcars_greeting.md")
-    #' ```
-    #'
-    #' @param echo Whether to print the greeting to the console. Options are
-    #'   `"none"` (default, no output) or `"output"` (print to console).
+    #' @param echo Whether to print the greeting to the console.
     #'
     #' @return The greeting string in Markdown format.
     generate_greeting = function(echo = c("none", "output")) {
-      private$require_data_source("$generate_greeting")
+      private$require_initialized("$generate_greeting")
       chat <- private$create_session_client()
       as.character(chat$chat(GREETING_PROMPT, echo = echo))
     },
@@ -809,17 +920,13 @@ QueryChat <- R6::R6Class(
     #' @description
     #' Clean up resources associated with the data source.
     #'
-    #' This method releases any resources (e.g., database connections)
-    #' associated with the data source. Call this when you are done using the
-    #' QueryChat object to avoid resource leaks.
-    #'
-    #' Note: If `auto_cleanup` was set to `TRUE` in the constructor, this will
-    #' be called automatically when the Shiny app stops.
-    #'
     #' @return Invisibly returns `NULL`. Resources are cleaned up internally.
     cleanup = function() {
-      if (!is.null(private$.data_source)) {
-        private$.data_source$cleanup()
+      if (!is.null(private$.query_executor)) {
+        private$.query_executor$cleanup()
+      }
+      for (source in private$.data_sources) {
+        source$cleanup()
       }
       invisible(NULL)
     }
@@ -827,29 +934,27 @@ QueryChat <- R6::R6Class(
   active = list(
     #' @field system_prompt Get the system prompt.
     system_prompt = function() {
-      private$require_data_source("$system_prompt")
+      private$require_initialized("$system_prompt")
       private$.system_prompt$render(tools = self$tools)
     },
 
-    #' @field data_source Get or set the current data source. When setting,
-    #'   the value is normalized and the system prompt is rebuilt.
+    #' @field data_source Removed. Use `$add_table()` and `$remove_table()` to manage tables.
     data_source = function(value) {
       if (missing(value)) {
-        private$.data_source
+        cli::cli_abort(
+          c(
+            "The {.field $data_source} property has been removed.",
+            "i" = "Use {.code qc$add_table(df, 'name')} to add a new table."
+          )
+        )
       } else {
-        old_source <- private$.data_source
-        private$.data_source <- normalize_data_source(
-          value,
-          private$.table_name
+        cli::cli_abort(
+          c(
+            "The {.field $data_source} setter has been removed.",
+            "i" = "Use {.code qc$add_table(df, 'name')} to add a new table.",
+            "i" = "Use {.code qc$add_table(df, 'name', replace = TRUE)} to replace one."
+          )
         )
-        if (
-          !is.null(old_source) && !identical(old_source, private$.data_source)
-        ) {
-          old_source$cleanup()
-        }
-        private$auto_fill_data_description()
-        private$build_system_prompt()
-        invisible(self)
       }
     }
   )
@@ -864,70 +969,22 @@ QueryChat <- R6::R6Class(
 #' # Quick start - chat with mtcars dataset in one line
 #' querychat_app(mtcars)
 #'
-#' # Add options
-#' querychat_app(
-#'   mtcars,
-#'   greeting = "Welcome to the mtcars explorer!",
-#'   client = "openai/gpt-4o"
-#' )
-#'
-#' # Chat with a database table (table_name required)
-#' con <- DBI::dbConnect(RSQLite::SQLite(), ":memory:")
-#' DBI::dbWriteTable(con, "mtcars", mtcars)
-#' querychat_app(con, "mtcars")
-#'
-#' # Create QueryChat class object
-#' qc <- querychat(mtcars, greeting = "Welcome to the mtcars explorer!")
-#'
-#' # Run the app later
-#' qc$app()
-#'
 #' @param data_source Either a data.frame or a database connection (e.g., DBI
 #'   connection).
 #' @param table_name A string specifying the table name to use in SQL queries.
-#'   If `data_source` is a data.frame, this is the name to refer to it by in
-#'   queries (typically the variable name). If not provided, will be inferred
-#'   from the variable name for data.frame inputs. For database connections,
-#'   this parameter is required.
 #' @param ... Additional arguments (currently unused).
-#' @param id Optional module ID for the QueryChat instance. If not provided,
-#'   will be auto-generated from `table_name`. The ID is used to namespace
-#'   the Shiny module.
-#' @param greeting Optional initial message to display to users. Can be a
-#'   character string (in Markdown format) or a file path. If not provided,
-#'   a greeting will be generated at the start of each conversation using the
-#'   LLM, which adds latency and cost. Use `$generate_greeting()` to create
-#'   a greeting to save and reuse.
-#' @param client Optional chat client. Can be:
-#'   - An [ellmer::Chat] object
-#'   - A string to pass to [ellmer::chat()] (e.g., `"openai/gpt-4o"`)
-#'   - `NULL` (default): Uses the `querychat.client` option, the
-#'     `QUERYCHAT_CLIENT` environment variable, or defaults to
-#'     [ellmer::chat_openai()]
-#' @param tools Which querychat tools to include in the chat client, by
-#'   default. `"filter"` includes the tools for filtering and resetting the
-#'   dashboard and `"query"` includes the tool for executing SQL queries.
-#'   Use `tools = "filter"` when you only want the dashboard filtering tools,
-#'   or when you want to disable the querying tool entirely to prevent the
-#'   LLM from seeing any of the data in your dataset. The legacy name
-#'   `"update"` is still accepted as an alias for `"filter"`.
-#' @param data_description Optional description of the data in plain text or
-#'   Markdown. Can be a string or a file path. This provides context to the
-#'   LLM about what the data represents.
+#' @param id Optional module ID for the QueryChat instance.
+#' @param greeting Optional initial message to display to users.
+#' @param client Optional chat client.
+#' @param tools Which querychat tools to include in the chat client.
+#' @param data_description Optional description of the data.
 #' @param categorical_threshold For text columns, the maximum number of unique
 #'   values to consider as a categorical variable. Default is 20.
-#' @param extra_instructions Optional additional instructions for the chat
-#'   model in plain text or Markdown. Can be a string or a file path.
-#' @param prompt_template Optional path to or string of a custom prompt
-#'   template file. If not provided, the default querychat template will be
-#'   used. See the package prompts directory for the default template format.
+#' @param extra_instructions Optional additional instructions for the chat model.
+#' @param prompt_template Optional path to or string of a custom prompt template.
+#' @param data_dict Optional data dictionary. A path to a YAML file or a list of paths.
 #' @param cleanup Whether or not to automatically run `$cleanup()` when the
-#'   Shiny session/app stops. By default, cleanup only occurs if `QueryChat`
-#'   is created within a Shiny app. Set to `TRUE` to always clean up, or
-#'   `FALSE` to never clean up automatically.
-#'
-#'   In `querychat_app()`, in-memory databases created for data frames are
-#'   always cleaned up.
+#'   Shiny session/app stops.
 #'
 #' @return A `QueryChat` object. See [QueryChat] for available methods.
 #'
@@ -945,6 +1002,7 @@ querychat <- function(
   categorical_threshold = 20,
   extra_instructions = NULL,
   prompt_template = NULL,
+  data_dict = NULL,
   cleanup = NA
 ) {
   if (is_missing(table_name)) {
@@ -971,14 +1029,13 @@ querychat <- function(
     categorical_threshold = categorical_threshold,
     extra_instructions = extra_instructions,
     prompt_template = prompt_template,
+    data_dict = data_dict,
     cleanup = cleanup
   )
 }
 
 #' @rdname querychat-convenience
-#' @param bookmark_store The bookmarking storage method. Passed to
-#'   [shiny::enableBookmarking()]. If `"url"` or `"server"`, the chat state
-#'   (including current query) will be bookmarked. Default is `"url"`.
+#' @param bookmark_store The bookmarking storage method. Default is `"url"`.
 #' @return Invisibly returns the chat object after the app stops.
 #'
 #' @export
@@ -994,6 +1051,7 @@ querychat_app <- function(
   categorical_threshold = 20,
   extra_instructions = NULL,
   prompt_template = NULL,
+  data_dict = NULL,
   cleanup = NA,
   bookmark_store = "url"
 ) {
@@ -1034,6 +1092,7 @@ querychat_app <- function(
     categorical_threshold = categorical_threshold,
     extra_instructions = extra_instructions,
     prompt_template = prompt_template,
+    data_dict = data_dict,
     cleanup = cleanup
   )
 
@@ -1080,6 +1139,31 @@ normalize_data_source <- function(data_source, table_name) {
   )
 }
 
+normalize_data_dicts <- function(data_dict) {
+  # Normalize `data_dict` into a plain list of parsed data dicts.
+  #
+  # `data_dict` may be NULL (giving an empty list), a character vector of
+  # paths, or a list of paths. Every path is read with read_data_dict().
+  # Any other input type, or a non-character list element, aborts.
+  if (is.null(data_dict)) {
+    return(list())
+  }
+  if (!is.character(data_dict) && !is.list(data_dict)) {
+    cli::cli_abort(
+      "{.arg data_dict} must be a file path or a list of file paths."
+    )
+  }
+  if (!all(vapply(data_dict, is.character, logical(1)))) {
+    cli::cli_abort(
+      "Each element of {.arg data_dict} must be a file path string."
+    )
+  }
+
+  # A character vector can hold several paths: read each element on its own
+  # instead of handing the whole vector to a single read_data_dict() call.
+  lapply(unname(data_dict), read_data_dict)
+}
+
 namespaced_id <- function(id, session = shiny::getDefaultReactiveDomain()) {
   if (is.null(session)) {
     id
diff --git a/pkg-r/R/QueryChatSystemPrompt.R b/pkg-r/R/QueryChatSystemPrompt.R
index ba11d454b..4e530929a 100644
--- a/pkg-r/R/QueryChatSystemPrompt.R
+++ b/pkg-r/R/QueryChatSystemPrompt.R
@@ -23,55 +23,56 @@ QueryChatSystemPrompt <- R6::R6Class(
     #'   path to a file containing the extra instructions.
     extra_instructions = NULL,
 
-    #' @field schema The database schema information.
-    schema = NULL,
-
     #' @field categorical_threshold Threshold for categorical column detection.
     categorical_threshold = NULL,
 
-    #' @field data_source Reference to the data source object.
-    data_source = NULL,
+    #' @field data_sources Named list of DataSource objects.
+    data_sources = NULL,
+
+    #' @field data_dicts List of data dict lists (from [read_data_dict()]).
+    data_dicts = NULL,
 
     #' @description
     #' Create a new QueryChatSystemPrompt object.
     #'
     #' @param prompt_template Path to template file or template string.
-    #' @param data_source A DataSource object for schema access.
+    #' @param data_sources Named list of DataSource objects.
     #' @param data_description Optional path to data description file or description string.
     #' @param extra_instructions Optional path to instructions file or instructions string.
     #' @param categorical_threshold Threshold for categorical column detection (default: 10).
+    #' @param data_dicts Optional list of data dict lists (from [read_data_dict()]).
     #'
     #' @return A new `QueryChatSystemPrompt` object.
     initialize = function(
       prompt_template,
-      data_source,
+      data_sources,
       data_description = NULL,
       extra_instructions = NULL,
-      categorical_threshold = 10
+      categorical_threshold = 10,
+      data_dicts = NULL
     ) {
-      # Load template (file or string) using helper
       self$template <- read_text(prompt_template)
 
-      # Load data_description (file, string, or NULL)
       if (!is.null(data_description)) {
         self$data_description <- read_text(data_description)
       }
 
-      # Load extra_instructions (file, string, or NULL)
       if (!is.null(extra_instructions)) {
         self$extra_instructions <- read_text(extra_instructions)
       }
 
-      # Only compute schema if the template references it
-      if (grepl("\\{\\{[{#^/]?\\s*schema\\b", self$template)) {
-        self$schema <- data_source$get_schema(
-          categorical_threshold = categorical_threshold
+      self$categorical_threshold <- categorical_threshold
+      self$data_sources <- data_sources
+      self$data_dicts <- data_dicts %||% list()
+
+      if (length(data_sources) > 1 && length(self$data_dicts) == 0) {
+        cli::cli_warn(
+          c(
+            "Multiple tables registered without a {.arg data_dict}.",
+            "i" = "Providing a {.arg data_dict} with table descriptions and relationships gives the LLM better context."
+          )
         )
-      } else {
-        self$schema <- ""
       }
-      self$categorical_threshold <- categorical_threshold
-      self$data_source <- data_source
     },
 
     #' @description
@@ -82,27 +83,42 @@ QueryChatSystemPrompt <- R6::R6Class(
     #'
     #' @return A character string containing the rendered system prompt.
     render = function(tools) {
-      # Build context for whisker rendering
-      db_type <- self$data_source$get_db_type()
-      is_duck_db <- tolower(db_type) == "duckdb"
+      first_source <- self$data_sources[[1]]
+      db_type <- first_source$get_db_type()
+      has_dicts <- length(self$data_dicts) > 0
 
-      # Get semantic views description (available with DBISource for Snowflake)
       semantic_views <- ""
-      if (inherits(self$data_source, "DBISource")) {
-        semantic_views <- self$data_source$get_semantic_views_description()
+      if (inherits(first_source, "DBISource")) {
+        semantic_views <- first_source$get_semantic_views_description()
+      }
+
+      # Compute schema for backward compat with templates using {{schema}}
+      schema <- ""
+      if (grepl("\\{\\{[{#^/]?\\s*schema\\b", self$template)) {
+        schema <- first_source$get_schema(
+          categorical_threshold = self$categorical_threshold
+        )
       }
 
       context <- list(
         db_type = db_type,
-        is_duck_db = is_duck_db,
+        is_duck_db = tolower(db_type) == "duckdb",
         semantic_views = semantic_views,
-        schema = self$schema,
+        schema = schema,
+        has_data_dicts = has_dicts,
+        data_dicts = if (has_dicts) self$generate_data_dicts_yaml() else "",
+        tables_overview = if (!has_dicts) {
+          self$generate_tables_overview()
+        } else {
+          ""
+        },
         data_description = self$data_description,
         extra_instructions = self$extra_instructions,
         has_tool_update = if ("update" %in% tools) "true",
         has_tool_query = if ("query" %in% tools) "true",
         has_tool_visualize = if ("visualize" %in% tools) "true",
-        include_query_guidelines = if (length(tools) > 0) "true"
+        include_query_guidelines = if (length(tools) > 0) "true",
+        multi_table = length(self$data_sources) > 1
       )
 
       partials <- list()
@@ -119,6 +135,95 @@ QueryChatSystemPrompt <- R6::R6Class(
       }
 
       whisker::whisker.render(self$template, context, partials = partials)
+    },
+
+    #' @description
+    #' Generate a plain-text tables overview for the system prompt.
+    generate_tables_overview = function() {
+      lines <- character()
+      for (name in names(self$data_sources)) {
+        source <- self$data_sources[[name]]
+        desc <- if (is.null(self$data_description)) {
+          source$get_data_description()
+        }
+        if (nzchar(desc %||% "")) {
+          lines <- c(lines, sprintf("- %s: %s", name, desc))
+        } else {
+          lines <- c(lines, sprintf("- %s", name))
+        }
+      }
+      paste(lines, collapse = "\n")
+    },
+
+    #' @description
+    #' Generate YAML-formatted data dict blocks for the system prompt.
+    generate_data_dicts_yaml = function() {
+      check_installed("yaml")
+      blocks <- character()
+      all_claimed <- character()
+      escape_attr <- function(s) gsub('"', "&quot;", s, fixed = TRUE)
+      for (dd in self$data_dicts) {
+        d <- data_dict_to_prompt_list(dd)
+        d$name <- NULL
+        d$description <- NULL
+
+        claimed <- intersect(names(self$data_sources), names(dd$tables))
+        all_claimed <- c(all_claimed, claimed)
+        if (!is.null(d$tables)) {
+          d$tables <- d$tables[names(d$tables) %in% names(self$data_sources)]
+          if (length(d$tables) == 0) d$tables <- NULL
+        }
+
+        # name/description are emitted as attributes of the <data-dict> tag.
+        attrs <- if (!is.null(dd$name)) {
+          sprintf('name="%s"', escape_attr(dd$name))
+        } else {
+          ""
+        }
+        if (!is.null(dd$description)) {
+          attrs <- paste0(
+            attrs,
+            sprintf(' description="%s"', escape_attr(dd$description))
+          )
+        }
+        attrs <- trimws(attrs)
+
+        body <- if (length(d) > 0) {
+          yaml::as.yaml(d, column.major = FALSE)
+        } else {
+          ""
+        }
+        body <- sub("\n$", "", body)
+
+        if (nzchar(body)) {
+          blocks <- c(
+            blocks,
+            sprintf('<data-dict %s>\n%s\n</data-dict>', attrs, body)
+          )
+        } else {
+          blocks <- c(blocks, sprintf('<data-dict %s/>', attrs))
+        }
+      }
+      # Registered tables that no data dict describes go in a <tables> block.
+      unclaimed <- setdiff(names(self$data_sources), all_claimed)
+      if (length(unclaimed) > 0) {
+        tables <- list()
+        for (name in unclaimed) {
+          desc <- if (is.null(self$data_description)) {
+            self$data_sources[[name]]$get_data_description()
+          }
+          # Assign with `[<-` and list(...): `tables[[name]] <- NULL` would
+          # drop the key, hiding tables without a description from the prompt.
+          tables[name] <- list(
+            if (nzchar(desc %||% "")) list(description = desc)
+          )
+        }
+        yaml_str <- yaml::as.yaml(list(tables = tables), column.major = FALSE)
+        yaml_str <- sub("\n$", "", yaml_str)
+        blocks <- c(blocks, sprintf("<tables>\n%s\n</tables>", yaml_str))
+      }
+
+      paste(blocks, collapse = "\n\n")
+    }
   )
 )
diff --git a/pkg-r/R/QueryExecutor.R b/pkg-r/R/QueryExecutor.R
new file mode 100644
index 000000000..1347e3d88
--- /dev/null
+++ b/pkg-r/R/QueryExecutor.R
@@ -0,0 +1,259 @@
+# Private R6 classes for multi-table query execution.
+#
+# These classes are not exported. They provide a unified interface over
+# different data source configurations (single DBI connection, shared DuckDB
+# for multiple data frames, etc.).
+
+QueryExecutor <- R6::R6Class(
+  "QueryExecutor",
+  public = list(
+    execute_query = function(query) {
+      cli::cli_abort(
+        "{.fn execute_query} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+    test_query = function(query, table_name, require_all_columns = FALSE) {
+      cli::cli_abort(
+        "{.fn test_query} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+    get_db_type = function() {
+      cli::cli_abort(
+        "{.fn get_db_type} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+    get_schema = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      cli::cli_abort(
+        "{.fn get_schema} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+    get_schema_result = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      cli::cli_abort(
+        "{.fn get_schema_result} must be implemented by subclass",
+        class = "not_implemented_error"
+      )
+    },
+    cleanup = function() {
+      invisible(NULL)
+    }
+  )
+)
+
+DuckDBExecutor <- R6::R6Class(
+  "DuckDBExecutor",
+  inherit = QueryExecutor,
+  private = list(
+    conn = NULL,
+    table_columns = list()
+  ),
+  public = list(
+    initialize = function(dataframes) {
+      check_installed("duckdb")
+
+      private$conn <- DBI::dbConnect(duckdb::duckdb(), dbdir = ":memory:")
+
+      for (name in names(dataframes)) {
+        duckdb::duckdb_register(
+          private$conn,
+          name,
+          dataframes[[name]],
+          experimental = FALSE
+        )
+      }
+
+      # Cache column names per table before lockdown
+      for (name in names(dataframes)) {
+        cols <- colnames(
+          DBI::dbGetQuery(
+            private$conn,
+            sprintf(
+              "SELECT * FROM %s WHERE 1=0",
+              DBI::dbQuoteIdentifier(private$conn, name)
+            )
+          )
+        )
+        private$table_columns[[name]] <- cols
+      }
+
+      duckdb_lock_down(private$conn)
+    },
+
+    execute_query = function(query) {
+      check_query(query)
+      DBI::dbGetQuery(private$conn, query)
+    },
+
+    test_query = function(query, table_name, require_all_columns = FALSE) {
+      # Run check_query() on `query`, fetch its first row, and (optionally)
+      # verify all cached columns of `table_name` are present. Returns the rows.
+      check_query(query)
+      rs <- DBI::dbSendQuery(private$conn, query)
+      # Clear the result set on every exit path, including a failing dbFetch().
+      on.exit(DBI::dbClearResult(rs), add = TRUE)
+      df <- DBI::dbFetch(rs, n = 1)
+      if (require_all_columns) {
+        result_columns <- names(df)
+        expected <- private$table_columns[[table_name]]
+        missing_columns <- setdiff(expected, result_columns)
+        if (length(missing_columns) > 0) {
+          missing_list <- paste0("'", missing_columns, "'", collapse = ", ")
+          cli::cli_abort(
+            c(
+              "Query result missing required columns: {missing_list}",
+              "i" = "The query must return all original table columns (in any order)."
+            ),
+            class = "querychat_missing_columns_error"
+          )
+        }
+      }
+
+      df
+    },
+
+    get_db_type = function() "DuckDB",
+
+    get_schema = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      get_schema_impl(
+        private$conn,
+        table_name,
+        categorical_threshold,
+        table_spec = table_spec
+      )
+    },
+
+    get_schema_result = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      details <- build_column_details_impl(
+        private$conn,
+        table_name,
+        categorical_threshold,
+        table_spec = table_spec
+      )
+      list(
+        text = format_schema_from_details(
+          as.character(DBI::dbQuoteIdentifier(private$conn, table_name)),
+          details
+        ),
+        columns = details
+      )
+    },
+
+    cleanup = function() {
+      if (!is.null(private$conn) && DBI::dbIsValid(private$conn)) {
+        DBI::dbDisconnect(private$conn, shutdown = TRUE)
+      }
+      invisible(NULL)
+    }
+  )
+)
+
+DataSourceExecutor <- R6::R6Class(
+  "DataSourceExecutor",
+  inherit = QueryExecutor,
+  private = list(
+    data_sources = NULL,
+    primary = NULL
+  ),
+  public = list(
+    initialize = function(data_sources) {
+      private$data_sources <- data_sources
+      private$primary <- data_sources[[1]]
+    },
+
+    execute_query = function(query) {
+      private$primary$execute_query(query)
+    },
+
+    test_query = function(query, table_name, require_all_columns = FALSE) {
+      private$data_sources[[table_name]]$test_query(
+        query,
+        require_all_columns = require_all_columns
+      )
+    },
+
+    get_db_type = function() {
+      private$primary$get_db_type()
+    },
+
+    get_schema = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      private$data_sources[[table_name]]$get_schema(
+        categorical_threshold,
+        table_spec = table_spec
+      )
+    },
+
+    get_schema_result = function(
+      table_name,
+      categorical_threshold,
+      table_spec = NULL
+    ) {
+      private$data_sources[[table_name]]$get_schema_result(
+        categorical_threshold,
+        table_spec = table_spec
+      )
+    },
+
+    cleanup = function() {
+      invisible(NULL)
+    }
+  )
+)
+
+# Factory function: chooses executor type based on data source types.
+build_query_executor <- function(data_sources) {
+  if (length(data_sources) == 1) {
+    return(DataSourceExecutor$new(data_sources))
+  }
+
+  first_source <- data_sources[[1]]
+
+  if (inherits(first_source, "DataFrameSource")) {
+    dataframes <- lapply(data_sources, function(ds) ds$get_data())
+    return(DuckDBExecutor$new(dataframes))
+  }
+
+  DataSourceExecutor$new(data_sources)
+}
+
+# Validates that a new source is compatible with existing sources.
+check_source_compatibility <- function(existing_sources, new_source, new_name) {
+  if (length(existing_sources) == 0) {
+    return(invisible(NULL))
+  }
+
+  first_source <- existing_sources[[1]]
+
+  if (!identical(class(new_source), class(first_source))) {
+    cli::cli_abort(
+      c(
+        "Cannot add {.cls {class(new_source)[1]}} table {.val {new_name}}: all tables must be the same type.",
+        "i" = "Existing tables use {.cls {class(first_source)[1]}}."
+      )
+    )
+  }
+
+  invisible(NULL)
+}
diff --git a/pkg-r/R/TableAccessor.R b/pkg-r/R/TableAccessor.R
new file mode 100644
index 000000000..2690a5520
--- /dev/null
+++ b/pkg-r/R/TableAccessor.R
@@ -0,0 +1,43 @@
+#' Table Accessor
+#'
+#' @description
+#' Accessor for a specific table's data source and per-table reactive state.
+#' Returned by the server return value's `$table("name")` method.
+#'
+#' @export
+#' @keywords internal
+TableAccessor <- R6::R6Class(
+  "TableAccessor",
+  private = list(
+    .table_name = NULL,
+    .data_source = NULL,
+    .state = NULL
+  ),
+  public = list(
+    #' @description Create a new TableAccessor.
+    #' @param table_name The name of the table.
+    #' @param data_source The DataSource for this table.
+    #' @param state List of per-table reactive state (`sql`, `title`, `df`).
+    initialize = function(table_name, data_source, state) {
+      private$.table_name <- table_name
+      private$.data_source <- data_source
+      private$.state <- state
+    },
+
+    #' @description Return the current filtered data for this table.
+    df = function() private$.state$df(),
+
+    #' @description Return the current SQL filter for this table.
+    sql = function() private$.state$sql(),
+
+    #' @description Return the current filter title for this table.
+    title = function() private$.state$title()
+  ),
+  active = list(
+    #' @field table_name The name of this table.
+    table_name = function() private$.table_name,
+
+    #' @field data_source The DataSource for this table.
+    data_source = function() private$.data_source
+  )
+)
diff --git a/pkg-r/R/TblSqlSource.R b/pkg-r/R/TblSqlSource.R
index 51e2d0078..7ab55e7ac 100644
--- a/pkg-r/R/TblSqlSource.R
+++ b/pkg-r/R/TblSqlSource.R
@@ -103,13 +103,35 @@ TblSqlSource <- R6::R6Class(
     #' @param categorical_threshold Maximum number of unique values for a text
     #'   column to be considered categorical
     #' @return A string containing schema information formatted for LLM prompts
-    get_schema = function(categorical_threshold = 20) {
+    get_schema = function(categorical_threshold = 20, table_spec = NULL) {
       get_schema_impl(
         private$conn,
         self$table_name,
         categorical_threshold,
         columns = colnames(private$tbl),
-        prep_query = self$prep_query
+        prep_query = self$prep_query,
+        table_spec = table_spec
+      )
+    },
+
+    get_schema_result = function(
+      categorical_threshold = 20,
+      table_spec = NULL
+    ) {
+      details <- build_column_details_impl(
+        private$conn,
+        self$table_name,
+        categorical_threshold,
+        columns = colnames(private$tbl),
+        prep_query = self$prep_query,
+        table_spec = table_spec
+      )
+      list(
+        text = format_schema_from_details(
+          as.character(DBI::dbQuoteIdentifier(private$conn, self$table_name)),
+          details
+        ),
+        columns = details
       )
     },
 
diff --git a/pkg-r/R/querychat-package.R b/pkg-r/R/querychat-package.R
index cc9656341..e5a51df40 100644
--- a/pkg-r/R/querychat-package.R
+++ b/pkg-r/R/querychat-package.R
@@ -76,6 +76,10 @@ NULL
 #' @rawNamespace if (getRversion() < "4.3.0") importFrom("S7", "@")
 NULL
 
+.onLoad <- function(libname, pkgname) {
+  rlang::run_on_load()
+}
+
 release_bullets <- function() {
   c(
     "Run `staticimports::import()` to update static imports",
diff --git a/pkg-r/R/querychat_module.R b/pkg-r/R/querychat_module.R
index ef668448b..efc9904b5 100644
--- a/pkg-r/R/querychat_module.R
+++ b/pkg-r/R/querychat_module.R
@@ -38,15 +38,15 @@ mod_ui <- function(
 # Main module server function
 mod_server <- function(
   id,
-  data_source,
+  data_sources,
+  executor,
   greeting,
   client,
   tools,
   enable_bookmarking = FALSE
 ) {
   shiny::moduleServer(id, function(input, output, session) {
-    current_title <- shiny::reactiveVal(NULL, label = "current_title")
-    current_query <- shiny::reactiveVal(NULL, label = "current_query")
+    current_table_val <- shiny::reactiveVal(NULL, label = "current_table")
     # Holds a generated greeting so it can be saved and restored on bookmark.
     # Static greetings live in the UI (chat_ui(greeting=)) and persist already.
     # Workaround for posit-dev/shinychat#253: shinychat does not bookmark
@@ -54,9 +54,32 @@ mod_server <- function(
     # the last_turn() capture below, and the greeting handling in
     # onBookmark/onRestore can be dropped (and the shinychat minimum bumped).
     current_greeting <- shiny::reactiveVal(NULL, label = "current_greeting")
-    filtered_df <- shiny::reactive(label = "filtered_df", {
-      data_source$execute_query(query = current_query())
-    })
+
+    # Per-table reactive state
+    tables <- list()
+    for (name in names(data_sources)) {
+      local({
+        tbl_name <- name
+        sql_val <- shiny::reactiveVal(NULL, label = paste0(tbl_name, "_sql"))
+        title_val <- shiny::reactiveVal(
+          NULL,
+          label = paste0(tbl_name, "_title")
+        )
+        df_val <- shiny::reactive(label = paste0(tbl_name, "_df"), {
+          q <- sql_val()
+          if (is.null(q)) {
+            data_sources[[tbl_name]]$get_data()
+          } else {
+            executor$execute_query(q)
+          }
+        })
+        tables[[tbl_name]] <<- list(
+          sql = sql_val,
+          title = title_val,
+          df = df_val
+        )
+      })
+    }
 
     append_output <- function(...) {
       txt <- paste0(...)
@@ -69,19 +92,26 @@ mod_server <- function(
       )
     }
 
-    update_dashboard <- function(query, title) {
+    update_dashboard <- function(query, title, table) {
       if (!is.null(query)) {
-        current_query(query)
+        tables[[table]]$sql(query)
       }
       if (!is.null(title)) {
-        current_title(title)
+        tables[[table]]$title(title)
       }
+      current_table_val(table)
     }
 
-    reset_query <- function() {
-      current_query(NULL)
-      current_title(NULL)
-      querychat_tool_result(action = "reset")
+    reset_query <- function(table) {
+      tables[[table]]$sql(NULL)
+      tables[[table]]$title(NULL)
+      current_table_val(table)
+      querychat_tool_result(
+        executor,
+        query = NULL,
+        action = "reset",
+        table_name = table
+      )
     }
 
     # Non-reactive bookkeeping for bookmark save/restore of viz widgets
@@ -170,17 +200,34 @@ mod_server <- function(
     })
 
     shiny::observeEvent(input$chat_update, label = "on_chat_update", {
-      current_query(input$chat_update$query)
-      current_title(input$chat_update$title)
+      tbl <- input$chat_update$table
+      if (!is.null(tbl) && tbl %in% names(tables)) {
+        q <- input$chat_update$query
+        ttl <- input$chat_update$title
+        tables[[tbl]]$sql(if (nzchar(q %||% "")) q else NULL)
+        tables[[tbl]]$title(if (nzchar(ttl %||% "")) ttl else NULL)
+        current_table_val(tbl)
+      }
     })
 
     if (enable_bookmarking) {
-      shinychat::chat_restore("chat", chat, session = session)
+      shinychat::chat_restore(
+        "chat",
+        chat,
+        restore_ui = FALSE,
+        session = session
+      )
       shiny::setBookmarkExclude("chat_update", session = session)
 
       shiny::onBookmark(function(state) {
-        state$values$querychat_sql <- current_query()
-        state$values$querychat_title <- current_title()
+        table_states <- list()
+        for (name in names(tables)) {
+          table_states[[name]] <- list(
+            sql = tables[[name]]$sql(),
+            title = tables[[name]]$title()
+          )
+        }
+        state$values$querychat_tables <- table_states
         if (!is.null(current_greeting())) {
           state$values$querychat_greeting <- current_greeting()
         }
@@ -190,11 +237,21 @@ mod_server <- function(
       })
 
       shiny::onRestore(function(state) {
-        if (!is.null(state$values$querychat_sql)) {
-          current_query(state$values$querychat_sql)
-        }
-        if (!is.null(state$values$querychat_title)) {
-          current_title(state$values$querychat_title)
+        if (!is.null(state$values$querychat_tables)) {
+          last_restored <- NULL
+          for (name in names(state$values$querychat_tables)) {
+            tbl_state <- state$values$querychat_tables[[name]]
+            if (!is.null(tbl_state$sql)) {
+              tables[[name]]$sql(tbl_state$sql)
+              last_restored <- name
+            }
+            if (!is.null(tbl_state$title)) {
+              tables[[name]]$title(tbl_state$title)
+            }
+          }
+          if (!is.null(last_restored)) {
+            current_table_val(last_restored)
+          }
         }
         if (!is.null(state$values$querychat_greeting)) {
           current_greeting(state$values$querychat_greeting)
@@ -209,7 +266,7 @@ mod_server <- function(
         }
         if (!is.null(state$values$querychat_viz_widgets)) {
           restored <- restore_viz_widgets(
-            data_source,
+            executor,
             state$values$querychat_viz_widgets,
             session
           )
@@ -218,12 +275,50 @@ mod_server <- function(
       })
     }
 
-    list(
-      client = chat,
-      sql = current_query,
-      title = current_title,
-      df = filtered_df
-    )
+    table_fn <- function(name) {
+      if (!name %in% names(tables)) {
+        available <- paste0("'", names(tables), "'", collapse = ", ")
+        cli::cli_abort(
+          "Table {.val {name}} not found. Available: {available}"
+        )
+      }
+      TableAccessor$new(name, data_sources[[name]], state = tables[[name]])
+    }
+
+    table_names_fn <- function() names(tables)
+
+    # Backward compat: for single-table, expose sql/title/df directly
+    if (length(data_sources) == 1) {
+      first <- tables[[1]]
+      list(
+        client = chat,
+        sql = first$sql,
+        title = first$title,
+        df = first$df,
+        table = table_fn,
+        table_names = table_names_fn,
+        current_table = current_table_val,
+        .tables = tables
+      )
+    } else {
+      single_table_error <- function(method) {
+        function(...) {
+          cli::cli_abort(
+            "Multiple tables registered. Use {.code qc_vals$table('name')${method}()} instead."
+          )
+        }
+      }
+      list(
+        client = chat,
+        sql = single_table_error("sql"),
+        title = single_table_error("title"),
+        df = single_table_error("df"),
+        table = table_fn,
+        table_names = table_names_fn,
+        current_table = current_table_val,
+        .tables = tables
+      )
+    }
   })
 }
 
@@ -234,7 +329,7 @@ GREETING_PROMPT <- paste(
   "using the suggestion card format from your instructions."
 )
 
-restore_viz_widgets <- function(data_source, saved_widgets, session) {
+restore_viz_widgets <- function(executor, saved_widgets, session) {
   if (!rlang::is_installed("ggsql")) {
     warning(
       "ggsql is not installed; skipping restoration of visualization widgets.",
@@ -248,7 +343,7 @@ restore_viz_widgets <- function(data_source, saved_widgets, session) {
     tryCatch(
       {
         validated <- ggsql::ggsql_validate(entry$ggsql)
-        spec <- execute_ggsql(data_source, validated)
+        spec <- execute_ggsql(executor, validated)
         session$output[[entry$widget_id]] <- ggsql::renderGgsql(spec)
         restored <- c(restored, list(entry))
       },
diff --git a/pkg-r/R/querychat_tools.R b/pkg-r/R/querychat_tools.R
index 26a3a261d..927f50443 100644
--- a/pkg-r/R/querychat_tools.R
+++ b/pkg-r/R/querychat_tools.R
@@ -1,34 +1,107 @@
+#' @noRd
+GetSchemaResult <- S7::new_class(
+  "GetSchemaResult",
+  parent = ellmer::ContentToolResult,
+  properties = list(
+    table_name = S7::class_character,
+    columns_json = S7::new_property(S7::class_character, default = "")
+  )
+)
+
+#' @importFrom shinychat contents_shinychat
+rlang::on_load({
+  S7::method(contents_shinychat, GetSchemaResult) <- get_schema_result_display
+
+  orig_request_contents <- S7::method(
+    contents_shinychat,
+    ellmer::ContentToolRequest
+  )
+  S7::method(contents_shinychat, ellmer::ContentToolRequest) <- function(
+    content
+  ) {
+    if (identical(content@name, "querychat_get_schema")) {
+      return(NULL)
+    }
+    orig_request_contents(content)
+  }
+})
+
+tool_get_schema <- function(
+  data_dicts,
+  executor,
+  table_names,
+  categorical_threshold
+) {
+  ellmer::tool(
+    function(table_name) {
+      if (!table_name %in% table_names) {
+        available <- paste0("'", table_names, "'", collapse = ", ")
+        cli::cli_abort(
+          "Table {.val {table_name}} not found. Available: {available}"
+        )
+      }
+      table_spec <- NULL
+      for (dd in data_dicts) {
+        if (!is.null(dd[["tables"]][[table_name]])) {
+          table_spec <- dd[["tables"]][[table_name]]
+          break
+        }
+      }
+      schema_result <- executor$get_schema_result(
+        table_name,
+        categorical_threshold,
+        table_spec = table_spec
+      )
+      columns_json <- jsonlite::toJSON(schema_result$columns, auto_unbox = TRUE)
+      GetSchemaResult(
+        value = schema_result$text,
+        table_name = table_name,
+        columns_json = as.character(columns_json)
+      )
+    },
+    name = "querychat_get_schema",
+    description = interpolate_package("tool-get-schema.md"),
+    arguments = list(
+      table_name = ellmer::type_string(
+        "The name of the table to retrieve schema for."
+      )
+    ),
+    annotations = ellmer::tool_annotations(title = "Get Schema")
+  )
+}
+
 # Modifies the data presented in the data dashboard, based on the given SQL
 # query, and also updates the title.
 # @param query A SQL query; must be a SELECT statement.
 # @param title A title to display at the top of the data dashboard,
 #   summarizing the intent of the SQL query.
 tool_update_dashboard <- function(
-  data_source,
-  update_fn = function(query, title) {}
+  executor,
+  table_names,
+  update_fn = function(query, title, table) {}
 ) {
-  check_data_source(data_source)
-
   check_function(update_fn)
-  has_args <- intersect(fn_fmls_names(update_fn), c("query", "title"))
-  if (length(has_args) != 2) {
-    missing_args <- setdiff(c("query", "title"), has_args)
+  has_args <- intersect(fn_fmls_names(update_fn), c("query", "title", "table"))
+  if (length(has_args) != 3) {
+    missing_args <- setdiff(c("query", "title", "table"), has_args)
     cli::cli_abort(
       c(
-        "{.arg update_fn} must accept at least two named arguments: {.val query} and {.val title}.",
+        "{.arg update_fn} must accept at least three named arguments: {.val query}, {.val title}, and {.val table}.",
         "x" = "{.val {missing_args}} argument{?s} {?was/were} missing."
       )
     )
   }
 
-  db_type <- data_source$get_db_type()
+  db_type <- executor$get_db_type()
+  multi_table <- length(table_names) > 1
 
   ellmer::tool(
-    tool_update_dashboard_impl(data_source, update_fn),
+    tool_update_dashboard_impl(executor, table_names, update_fn),
     name = "querychat_update_dashboard",
     description = interpolate_package(
       "tool-update-dashboard.md",
-      db_type = db_type
+      db_type = db_type,
+      multi_table = multi_table
     ),
     arguments = list(
       query = ellmer::type_string(
@@ -39,6 +112,9 @@ tool_update_dashboard <- function(
       ),
       title = ellmer::type_string(
         "A brief title for display purposes, summarizing the intent of the SQL query."
+      ),
+      table = ellmer::type_string(
+        "The name of the table to update the dashboard for."
       )
     ),
     annotations = ellmer::tool_annotations(
@@ -48,34 +124,50 @@ tool_update_dashboard <- function(
   )
 }
 
-tool_update_dashboard_impl <- function(data_source, update_fn) {
-  force(data_source)
+tool_update_dashboard_impl <- function(executor, table_names, update_fn) { # returns the closure used as the tool body
+  force(executor) # evaluate the argument now rather than on first use inside the closure
+  force(table_names) # NOTE(review): forced here but not referenced by the closure below
 
-  function(query, title) {
+  function(query, title, table) { # `table` is forwarded as `table_name` and on to `update_fn`
     res <- querychat_tool_result(
-      data_source,
+      executor,
       query = query,
       title = title,
-      action = "update"
+      action = "update",
+      table_name = table
     )
 
     if (is.null(res@error)) {
-      update_fn(query, title)
+      update_fn(query, title, table) # callback runs only when the result carries no error
     }
 
     res
   }
 }
 
-
-tool_reset_dashboard <- function(reset_fn = identity) {
+tool_reset_dashboard <- function(
+  reset_fn = function(table) {},
+  table_names
+) {
   check_function(reset_fn)
 
   ellmer::tool(
-    reset_fn,
+    function(table) {
+      if (!table %in% table_names) {
+        available <- paste0("'", table_names, "'", collapse = ", ")
+        cli::cli_abort(
+          "Table {.val {table}} not found. Available: {available}"
+        )
+      }
+      reset_fn(table)
+    },
     name = "querychat_reset_dashboard",
     description = interpolate_package("tool-reset-dashboard.md"),
-    arguments = list(),
+    arguments = list(
+      table = ellmer::type_string(
+        "The name of the table to reset the dashboard for."
+      )
+    ),
     annotations = ellmer::tool_annotations(
       title = "Reset Dashboard",
       icon = '<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 16 16" class="bi bi-arrow-counterclockwise " style="height:1em;width:1em;fill:currentColor;vertical-align:-0.125em;" aria-hidden="true" role="img" ><path fill-rule="evenodd" d="M8 3a5 5 0 1 1-4.546 2.914.5.5 0 0 0-.908-.417A6 6 0 1 0 8 2v1z"></path><path d="M8 4.466V.534a.25.25 0 0 0-.41-.192L5.23 2.308a.25.25 0 0 0 0 .384l2.36 1.966A.25.25 0 0 0 8 4.466z"></path></svg>'
@@ -86,22 +178,24 @@ tool_reset_dashboard <- function(reset_fn = identity) {
 # Perform a SQL query on the data, and return the results as JSON.
 # @param query A SQL query; must be a SELECT statement.
 # @return The results of the query as a data frame.
-tool_query <- function(data_source) {
-  check_data_source(data_source)
-
-  db_type <- data_source$get_db_type()
+tool_query <- function(executor, multi_table = FALSE) {
+  db_type <- executor$get_db_type()
 
   ellmer::tool(
     function(query, collapsed = NULL, `_intent` = "") {
       querychat_tool_result(
-        data_source,
+        executor,
         query,
         action = "query",
         collapsed = collapsed
       )
     },
     name = "querychat_query",
-    description = interpolate_package("tool-query.md", db_type = db_type),
+    description = interpolate_package(
+      "tool-query.md",
+      db_type = db_type,
+      multi_table = multi_table
+    ),
     arguments = list(
       query = ellmer::type_string(
         ellmer::interpolate(
@@ -141,10 +235,12 @@ querychat_tool_details_option <- function() {
   valid_settings <- c("expanded", "collapsed", "default")
 
   if (!setting %in% valid_settings) {
-    cli::cli_warn(c(
-      "Invalid value for {.code querychat.tool_details} option or {.envvar QUERYCHAT_TOOL_DETAILS} environment variable: {.val {setting}}",
-      "i" = "Must be one of: {.or {.val {valid_settings}}}"
-    ))
+    cli::cli_warn(
+      c(
+        "Invalid value for {.code querychat.tool_details} option or {.envvar QUERYCHAT_TOOL_DETAILS} environment variable: {.val {setting}}",
+        "i" = "Must be one of: {.or {.val {valid_settings}}}"
+      )
+    )
     return(NULL)
   }
 
@@ -167,10 +263,11 @@ querychat_tool_starts_open <- function(action) {
 }
 
 querychat_tool_result <- function(
-  data_source,
+  executor,
   query,
   title = NULL,
   action = "update",
+  table_name = NULL,
   collapsed = NULL
 ) {
   action <- arg_match(action, c("update", "query", "reset"))
@@ -184,10 +281,14 @@ querychat_tool_result <- function(
     switch(
       action,
       update = {
-        data_source$test_query(query, require_all_columns = TRUE)
+        executor$test_query(
+          query,
+          table_name = table_name,
+          require_all_columns = TRUE
+        )
         NULL
       },
-      query = data_source$execute_query(query),
+      query = executor$execute_query(query),
       reset = "The dashboard has been reset to show all data."
     ),
     error = function(err) err
@@ -214,6 +315,7 @@ querychat_tool_result <- function(
         class = "btn btn-outline-primary btn-sm float-end mt-3 querychat-update-dashboard-btn",
         "data-query" = query,
         "data-title" = title,
+        "data-table" = table_name,
         switch(action, update = "Apply Filter", reset = "Reset Filter")
       )
     )
@@ -250,3 +352,26 @@ querychat_tool_result <- function(
     )
   )
 }
+
+schema_dep <- function() { # HTML dependency that ships schema-display.js with the rendered output
+  htmltools::htmlDependency(
+    name = "querychat-schema-display",
+    version = utils::packageVersion("querychat"), # dependency version follows the installed package version
+    package = "querychat", # with `package` set, a relative `src` is looked up inside that package
+    src = "htmldep",
+    script = "schema-display.js"
+  )
+}
+
+get_schema_result_display <- function(content) { # reads content@table_name, content@value, content@columns_json
+  htmltools::tagList(
+    htmltools::tags$span(
+      class = "qc-schema-collector", # presumably the hook schema-display.js looks for; confirm against the script
+      `data-table` = content@table_name,
+      `data-schema` = content@value,
+      `data-schema-json` = content@columns_json,
+      style = "display:none" # hidden: the span only carries the data-* payload
+    ),
+    schema_dep() # attach the script dependency alongside the span
+  )
+}
diff --git a/pkg-r/R/querychat_viz.R b/pkg-r/R/querychat_viz.R
index 980dc96ad..a1b084fe8 100644
--- a/pkg-r/R/querychat_viz.R
+++ b/pkg-r/R/querychat_viz.R
@@ -1,16 +1,15 @@
 tool_visualize_dashboard <- function(
-  data_source,
+  executor,
   session,
   update_fn = function(data) {},
   has_tool_query = FALSE
 ) {
-  check_data_source(data_source)
   check_function(update_fn)
 
-  db_type <- data_source$get_db_type()
+  db_type <- executor$get_db_type()
 
   ellmer::tool(
-    tool_visualize_impl(data_source, session, update_fn),
+    tool_visualize_impl(executor, session, update_fn),
     name = "querychat_visualize",
     description = render_viz_tool_description(
       db_type = db_type,
@@ -34,13 +33,13 @@ tool_visualize_dashboard <- function(
   )
 }
 
-tool_visualize_impl <- function(data_source, session, update_fn) {
-  force(data_source)
+tool_visualize_impl <- function(executor, session, update_fn) { # returns the closure used as the tool body
+  force(executor) # evaluate the argument now rather than on first use inside the closure
   force(session)
   force(update_fn)
 
   function(ggsql, title) {
-    visualize_result(data_source, session, update_fn, ggsql, title)
+    visualize_result(executor, session, update_fn, ggsql, title) # delegate with the captured arguments
   }
 }
 
@@ -52,7 +51,7 @@ random_hex <- function(n_bytes = 8) {
 }
 
 visualize_result <- function(
-  data_source,
+  executor,
   session,
   update_fn,
   ggsql_str,
@@ -73,7 +72,7 @@ visualize_result <- function(
     rlang::abort(collapse_validation_errors(validated))
   }
 
-  spec <- execute_ggsql(data_source, validated)
+  spec <- execute_ggsql(executor, validated)
 
   widget_id <- paste0("querychat_viz_", random_hex())
 
@@ -89,13 +88,15 @@ visualize_result <- function(
   } else {
     # Non-Shiny usage: print the Spec to display via the interactive viewer
     print(spec)
-    update_fn(list(ggsql = ggsql_str, title = title, widget_id = widget_id))
-    return(ellmer::ContentToolResult(
-      value = sprintf(
-        "Chart displayed%s.",
-        if (nzchar(title)) sprintf(" with title '%s'", title) else ""
+    update_fn(list(ggsql = ggsql_str, title = title, widget_id = widget_id)) # nolint
+    return(
+      ellmer::ContentToolResult(
+        value = sprintf(
+          "Chart displayed%s.",
+          if (nzchar(title)) sprintf(" with title '%s'", title) else ""
+        )
       )
-    ))
+    )
   }
 
   # PNG snapshot for LLM feedback (best-effort; requires V8 + rsvg)
@@ -107,12 +108,14 @@ visualize_result <- function(
       ellmer::content_image_file(png_file)
     },
     error = function(e) {
-      cli::cli_warn(c(
-        "Unable to render PNG preview for the visualization card.",
-        "i" = "The interactive chart will still render, but the LLM will not receive the static image preview for this visualization.",
-        "i" = "PNG preview generation requires optional dependencies used by {.fn ggsql::ggsql_save}, typically {.pkg V8} and {.pkg rsvg}.",
-        "x" = "Underlying error: {.msg {conditionMessage(e)}}"
-      ))
+      cli::cli_warn(
+        c(
+          "Unable to render PNG preview for the visualization card.",
+          "i" = "The interactive chart will still render, but the LLM will not receive the static image preview for this visualization.",
+          "i" = "PNG preview generation requires optional dependencies used by {.fn ggsql::ggsql_save}, typically {.pkg V8} and {.pkg rsvg}.",
+          "x" = "Underlying error: {.msg {conditionMessage(e)}}"
+        )
+      )
       NULL
     }
   )
@@ -279,19 +282,19 @@ render_viz_tool_description <- function(db_type, has_tool_query = FALSE) {
   )
 }
 
-#' Execute a pre-validated ggsql query against a DataSource
+#' Execute a pre-validated ggsql query against an executor
 #'
-#' Executes the SQL portion through a DataSource (preserving database pushdown),
+#' Executes the SQL portion through an executor (preserving database pushdown),
 #' then feeds the result into a ggsql DuckDB reader to produce a Spec.
 #'
-#' @param data_source A querychat DataSource R6 object.
+#' @param executor A querychat QueryExecutor R6 object.
 #' @param validated A pre-validated ggsql query (from `ggsql::ggsql_validate()`).
 #'   Must be a list with `$sql` and `$visual` fields.
 #'
 #' @return A `ggsql::Spec` R6 object (the writer-independent plot specification).
 #'
 #' @keywords internal
-execute_ggsql <- function(data_source, validated) {
+execute_ggsql <- function(executor, validated) {
   rlang::check_installed("ggsql", reason = "for visualization support.")
 
   visual <- validated$visual
@@ -302,7 +305,7 @@ execute_ggsql <- function(data_source, validated) {
     )
   }
 
-  df <- data_source$execute_query(validated$sql)
+  df <- executor$execute_query(validated$sql)
 
   if (inherits(df, "tbl_sql")) {
     # Materialize the query for ggsql, {dplyr} guaranteed by TblSqlSource
diff --git a/pkg-r/R/utils-check.R b/pkg-r/R/utils-check.R
index d9ff53f81..966df62d7 100644
--- a/pkg-r/R/utils-check.R
+++ b/pkg-r/R/utils-check.R
@@ -12,7 +12,6 @@ check_data_source <- function(
   }
 }
 
-
 # SQL table name validation ----------------------------------------------
 
 #' Check SQL table name validity
@@ -77,7 +76,6 @@ sanitize_table_name <- function(x) {
   out
 }
 
-
 # SQL query validation --------------------------------------------------------
 
 #' Check SQL query for disallowed operations
diff --git a/pkg-r/R/utils-ellmer.R b/pkg-r/R/utils-ellmer.R
index aadbe8953..c8088bbd4 100644
--- a/pkg-r/R/utils-ellmer.R
+++ b/pkg-r/R/utils-ellmer.R
@@ -1,5 +1,4 @@
-interpolate_package <- function(path, ..., .envir = parent.frame()) {
-  # This helper replicates ellmer::interpolate_package() to work with load_all()
+interpolate_package <- function(path, ...) {
   stopifnot(
     "`path` must be a single string" = is.character(path),
     "`path` must be a single string" = length(path) == 1
@@ -11,10 +10,10 @@ interpolate_package <- function(path, ..., .envir = parent.frame()) {
     "`path` does not exist" = file.exists(path)
   )
 
-  ellmer::interpolate_file(path, ..., .envir = .envir)
+  template <- read_utf8(path)
+  whisker::whisker.render(template, list(...))
 }
 
-
 as_querychat_client <- function(client = NULL) {
   if (is.null(client)) {
     client <- querychat_client_option()
diff --git a/pkg-r/README.md b/pkg-r/README.md
index ca99f97fb..740cbad3a 100644
--- a/pkg-r/README.md
+++ b/pkg-r/README.md
@@ -59,8 +59,7 @@ With the [visualization tool](https://posit-dev.github.io/querychat/r/articles/v
 
 ## Custom apps
 
-querychat is designed to be highly extensible -- it provides programmatic access to the chat interface, the filtered/sorted data frame, SQL queries, and more.
-This makes it easy to build custom web apps that leverage natural language interaction with your data.
+querychat is designed to be highly extensible — it provides programmatic access to the chat interface, the filtered/sorted data frame, SQL queries, and more. You can register [multiple related tables](https://posit-dev.github.io/querychat/r/articles/build.html#multiple-tables) for cross-table queries and joins, and connect all of it to your own visualizations and layouts.
 For example, [here](https://github.com/posit-conf-2025/llm/blob/main/_solutions/25_querychat/25_querychat_02-end-app.R)'s a bespoke app for exploring Airbnb listings in Ashville, NC:
 
 ![](man/figures/airbnb.png){alt="A custom app for exploring Airbnb listings, powered by querychat." class="shadow rounded mb-3"}
@@ -69,9 +68,9 @@ To learn more, see [Build an app](https://posit-dev.github.io/querychat/r/articl
 
 ## How it works
 
-querychat uses LLMs to translate natural language into SQL queries. Models of all sizes, from small ones you can run locally to large frontier models from major AI providers, are remarkably effective at this task. But even the best models need to understand your data's overall structure to perform well.
+querychat uses LLMs to translate natural language into SQL queries. Models of all sizes, from small ones you can run locally to large frontier models from major AI providers, are remarkably effective at this task. But even the best models need to understand your data's structure to perform well.
 
-To address this, querychat includes schema metadata -- column names, types, ranges, categorical values -- in the LLM's [system prompt](https://posit-dev.github.io/querychat/r/articles/context.html). Importantly, querychat **does not** send raw data to the LLM; it shares only enough structural information for the model to generate accurate queries. When the LLM produces a query, querychat executes it in a SQL database (DuckDB[^duckdb], by default) to obtain precise results.
+To address this, querychat provides a schema retrieval [tool](https://posit-dev.github.io/querychat/r/articles/tools.html#schema-retrieval) that the LLM calls on demand to learn about table structure — column names, types, ranges, and categorical values. You can further improve results by providing a [data dictionary](https://posit-dev.github.io/querychat/r/articles/context.html#data-dictionary) with column descriptions, table relationships, and domain terminology. Importantly, querychat **does not** send raw data to the LLM; it shares only enough structural information for the model to generate accurate queries. When the LLM produces a query, querychat executes it in a SQL database (DuckDB[^duckdb], by default) to obtain precise results.
 
 This design makes querychat reliable, safe, and reproducible:
 
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/app.R b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/app.R
new file mode 100644
index 000000000..556c5f79f
--- /dev/null
+++ b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/app.R
@@ -0,0 +1,257 @@
+library(shiny)
+library(bslib)
+library(querychat)
+library(arrow)
+library(dplyr)
+library(tidyr)
+library(plotly)
+library(DT)
+
+# ── Data ──────────────────────────────────────────────────────────────────────
+
+data_dir <- file.path("data", "foodbank")
+
+foods <- read_parquet(file.path(data_dir, "foods.parquet"))
+food_categories <- read_parquet(file.path(data_dir, "food_categories.parquet"))
+nutrients <- read_parquet(file.path(data_dir, "nutrients.parquet"))
+food_nutrients <- read_parquet(file.path(data_dir, "food_nutrients.parquet"))
+food_portions <- read_parquet(file.path(data_dir, "food_portions.parquet"))
+measure_units <- read_parquet(file.path(data_dir, "measure_units.parquet"))
+
+nutrient_id_to_col <- c( # lookup: nutrient_id (as a string) -> wide column name
+  "1008" = "energy_kcal",
+  "1003" = "protein_g",
+  "1004" = "fat_g",
+  "1005" = "carbs_g",
+  "1079" = "fiber_g",
+  "1063" = "sugars_g",
+  "1258" = "sat_fat_g",
+  "1087" = "calcium_mg",
+  "1089" = "iron_mg",
+  "1093" = "sodium_mg",
+  "1162" = "vitamin_c_mg",
+  "1092" = "potassium_mg"
+)
+
+wide_nutrients <- food_nutrients |>
+  mutate(col = nutrient_id_to_col[as.character(nutrient_id)]) |> # ids missing from the lookup become NA
+  filter(!is.na(col)) |> # keep only nutrients named in the lookup
+  select(fdc_id, col, amount) |>
+  pivot_wider(names_from = col, values_from = amount) # one row per fdc_id, one column per nutrient
+
+foods_wide <- foods |>
+  left_join(
+    food_categories |>
+      select(id, description) |>
+      rename(category = description), # presumably renamed so it does not clash with foods' own description column
+    by = c("food_category_id" = "id")
+  ) |>
+  left_join(wide_nutrients, by = "fdc_id") # left join: foods without nutrient rows get NA nutrient columns
+
+# ── QueryChat ─────────────────────────────────────────────────────────────────
+
+greeting <- paste0(
+  "## USDA Foundation Foods Explorer\n\n",
+  "Real nutrition data for **436 foods** across 19 categories — ",
+  "macronutrients, minerals, vitamins, and serving sizes.\n\n",
+  "**Filter this view**\n\n",
+  '<span class="suggestion">Show only foods where fiber exceeds sugar</span>\n\n',
+  '<span class="suggestion">High-protein, low-fat foods: protein > 20g and fat < 5g per 100g</span>\n\n',
+  '<span class="suggestion">Foods higher in potassium than sodium</span>\n\n',
+  "**Dig deeper**\n\n",
+  '<span class="suggestion">Which fruits or vegetables beat whole milk for calcium?</span>\n\n',
+  '<span class="suggestion">Rank all foods by protein per calorie</span>\n\n',
+  '<span class="suggestion">For 1 cup of oats, how much protein and fiber am I getting?</span>\n\n'
+)
+
+qc <- QueryChat$new(
+  foods,
+  "foods",
+  data_dict = "nutrition-data-dict.yaml",
+  greeting = greeting
+)
+qc$add_table(food_categories, "food_categories")
+qc$add_table(nutrients, "nutrients")
+qc$add_table(food_nutrients, "food_nutrients")
+qc$add_table(food_portions, "food_portions")
+qc$add_table(measure_units, "measure_units")
+
+# ── App ───────────────────────────────────────────────────────────────────────
+
+ui <- page_navbar(
+  title = "USDA Foundation Foods",
+  sidebar = sidebar(
+    qc$ui(),
+    width = 400,
+    fillable = TRUE,
+    class = "querychat-sidebar"
+  ),
+  nav_panel(
+    "Overview",
+    layout_columns(
+      value_box(
+        "Foods",
+        textOutput("n_foods"),
+        showcase = bsicons::bs_icon("grid"),
+        theme = "primary"
+      ),
+      value_box(
+        "Avg Protein",
+        textOutput("avg_protein"),
+        showcase = bsicons::bs_icon("egg-fried"),
+        theme = "success"
+      ),
+      value_box(
+        "Avg Fiber",
+        textOutput("avg_fiber"),
+        showcase = bsicons::bs_icon("tree"),
+        theme = "info"
+      ),
+      value_box(
+        "Avg Calories",
+        textOutput("avg_calories"),
+        showcase = bsicons::bs_icon("fire"),
+        theme = "warning"
+      ),
+      col_widths = c(3, 3, 3, 3),
+      fill = FALSE
+    ),
+    layout_columns(
+      card(
+        full_screen = TRUE,
+        card_header(textOutput("protein_chart_title", inline = TRUE)),
+        plotlyOutput("protein_chart")
+      ),
+      card(
+        full_screen = TRUE,
+        card_header("Avg protein by category (top 10)"),
+        plotlyOutput("macro_chart")
+      )
+    )
+  ),
+  nav_panel(
+    "Data",
+    do.call(
+      navset_card_underline,
+      c(
+        lapply(qc$table_names(), function(name) {
+          nav_panel(name, DTOutput(paste0("dt_", name)))
+        }),
+        list(id = "table_tabs", full_screen = TRUE)
+      )
+    )
+  ),
+  fillable = TRUE
+)
+
+server <- function(input, output, session) { # Shiny server: summary boxes, two charts, one DT per table
+  qc_vals <- qc$server()
+
+  current_subset <- reactive({ # rows of foods_wide whose fdc_id is in the current `foods` data frame
+    ids <- qc_vals$table("foods")$df()[["fdc_id"]]
+    foods_wide[foods_wide$fdc_id %in% ids, ]
+  })
+
+  output$n_foods <- renderText(nrow(current_subset()))
+
+  output$avg_protein <- renderText({
+    v <- mean(current_subset()$protein_g, na.rm = TRUE)
+    if (is.nan(v)) "—" else sprintf("%.1f g", v) # mean() is NaN when no non-missing values remain
+  })
+
+  output$avg_fiber <- renderText({
+    v <- mean(current_subset()$fiber_g, na.rm = TRUE)
+    if (is.nan(v)) "—" else sprintf("%.1f g", v)
+  })
+
+  output$avg_calories <- renderText({
+    v <- mean(current_subset()$energy_kcal, na.rm = TRUE)
+    if (is.nan(v)) "—" else sprintf("%.0f kcal", v)
+  })
+
+  output$protein_chart_title <- renderText({
+    n <- sum(!is.na(current_subset()$protein_g))
+    sprintf("Top %d foods by protein (g/100g)", min(n, 15L)) # title count is capped at the 15 bars drawn below
+  })
+
+  output$protein_chart <- renderPlotly({
+    df <- current_subset() |>
+      filter(!is.na(protein_g)) |>
+      arrange(desc(protein_g)) |>
+      head(15) |>
+      mutate(label = substr(description, 1, 35)) # truncate names to 35 characters for the axis labels
+
+    plot_ly(
+      df,
+      x = ~protein_g,
+      y = ~ reorder(label, protein_g),
+      type = "bar",
+      orientation = "h",
+      marker = list(color = "#2196F3")
+    ) |>
+      layout(
+        showlegend = FALSE,
+        xaxis = list(title = "Protein (g/100g)"),
+        yaxis = list(title = ""),
+        margin = list(l = 10, r = 40, t = 10, b = 40)
+      )
+  })
+
+  output$macro_chart <- renderPlotly({
+    subset <- current_subset()
+    top_cats <- subset |> # the 10 categories with the most rows in the current subset
+      count(category, sort = TRUE) |>
+      head(10) |>
+      pull(category)
+
+    agg <- subset |>
+      filter(category %in% top_cats) |>
+      group_by(category) |>
+      summarise(
+        avg_protein = mean(protein_g, na.rm = TRUE),
+        .groups = "drop"
+      ) |>
+      arrange(desc(avg_protein))
+
+    plot_ly(
+      agg,
+      x = ~avg_protein,
+      y = ~ reorder(category, avg_protein),
+      type = "bar",
+      orientation = "h",
+      marker = list(color = "#4CAF50")
+    ) |>
+      layout(
+        showlegend = FALSE,
+        xaxis = list(title = "Avg protein (g/100g)"),
+        yaxis = list(title = ""),
+        margin = list(l = 10, r = 10, t = 10, b = 10)
+      )
+  })
+
+  # Select the matching tab in "table_tabs" whenever current_table() is non-NULL.
+  observe({
+    ct <- qc_vals$current_table()
+    if (!is.null(ct)) {
+      nav_select("table_tabs", selected = ct, session = session)
+    }
+  })
+
+  # Register one DT render per table (output ids are "dt_<table name>").
+  # Value boxes and charts above remain tied to the `foods` table — they
+  # use foods-specific wide-format joins and are not generic per-table views.
+  for (tbl_name in qc$table_names()) {
+    local({
+      name <- tbl_name # copy into this local() scope so each render keeps its own table name
+      output[[paste0("dt_", name)]] <- renderDT({
+        qc_vals$table(name)$df() |>
+          datatable(
+            fillContainer = TRUE,
+            options = list(pageLength = 25, scrollX = TRUE)
+          )
+      })
+    })
+  }
+}
+
+shinyApp(ui, server)
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_categories.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_categories.parquet
new file mode 100644
index 000000000..10f6d585a
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_categories.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet
new file mode 100644
index 000000000..87edd01ac
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_nutrients.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_portions.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_portions.parquet
new file mode 100644
index 000000000..b9fc1b411
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/food_portions.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/foods.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/foods.parquet
new file mode 100644
index 000000000..c52fd37fe
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/foods.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/measure_units.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/measure_units.parquet
new file mode 100644
index 000000000..7a4019495
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/measure_units.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/nutrients.parquet b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/nutrients.parquet
new file mode 100644
index 000000000..23c533adb
Binary files /dev/null and b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/data/foodbank/nutrients.parquet differ
diff --git a/pkg-r/inst/examples-shiny/11-multi-table-nutrition/nutrition-data-dict.yaml b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/nutrition-data-dict.yaml
new file mode 100644
index 000000000..a8455e6fc
--- /dev/null
+++ b/pkg-r/inst/examples-shiny/11-multi-table-nutrition/nutrition-data-dict.yaml
@@ -0,0 +1,161 @@
+version: "0.2.0"
+
+tables:
+  foods:
+    description: >
+      One row per USDA Foundation Food item. Nutrient values are not stored here —
+      see food_nutrients. All nutrient amounts in food_nutrients are per 100g of the food.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique food identifier from USDA FoodData Central.
+      - name: description
+        type: string
+        description: Full name of the food item (e.g., "Broccoli, raw").
+      - name: food_category_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Category of the food. Joins to food_categories.id.
+      - name: publication_date
+        type: date
+        description: Date the food record was published by USDA.
+
+  food_categories:
+    description: Lookup table of USDA food categories. One row per category.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique category identifier.
+      - name: code
+        type: number
+        description: USDA numeric category code (e.g., 1100 for Vegetables).
+      - name: description
+        type: string
+        description: Human-readable category name (e.g., "Vegetables and Vegetable Products").
+
+  nutrients:
+    description: >
+      Registry of the 12 key nutritional compounds tracked in this dataset.
+      One row per nutrient type. See the glossary for the full list of nutrient IDs.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: USDA nutrient identifier (e.g., 1003 for Protein).
+      - name: name
+        type: string
+        description: >
+          Official USDA nutrient name (e.g., "Protein", "Total lipid (fat)",
+          "Carbohydrate, by difference").
+      - name: unit_name
+        type: enum
+        values: [G, KCAL, MG]
+        description: Unit of measurement. G = grams, KCAL = kilocalories, MG = milligrams.
+
+  food_nutrients:
+    description: >
+      Nutrient content per 100g of food. One row per food–nutrient combination.
+      Only the 12 key nutrients are included (see nutrients table and glossary).
+      To get nutrient values for a food, join on fdc_id.
+      To get nutrient names and units, join nutrients on nutrient_id.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the food. Joins to foods.fdc_id.
+      - name: nutrient_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the nutrient. Joins to nutrients.id.
+      - name: amount
+        type: number(quantity)
+        description: >
+          Amount of the nutrient per 100g of food, in the unit given by
+          nutrients.unit_name. May be null if the nutrient was not measured
+          for this food.
+
+  food_portions:
+    description: >
+      Common serving sizes for foods. One row per portion definition.
+      A single food may have multiple portions (e.g., "1 cup" and "1 oz").
+      Not all foods have portion data — only 116 of the 436 foods are covered.
+    columns:
+      - name: fdc_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Identifies the food. Joins to foods.fdc_id.
+      - name: seq_num
+        type: number
+        description: Sequence number ordering multiple portions for the same food.
+      - name: amount
+        type: number(quantity)
+        description: >
+          The number of measure units in this portion (e.g., 1.0 for "1 cup",
+          2.0 for "2 tablespoons").
+      - name: measure_unit_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: Unit of the portion. Joins to measure_units.id.
+      - name: gram_weight
+        type: number(quantity)
+        description: Weight in grams of this portion (e.g., 240 for 1 cup of milk).
+      - name: modifier
+        type: string
+        description: >
+          Optional preparation note for the portion (e.g., "chopped", "drained",
+          "cooked"). Null when no modifier applies.
+
+  measure_units:
+    description: >
+      Lookup table of measurement unit names used in food_portions.
+      Only units that appear in food_portions are included (~32 of the 123 total).
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique unit identifier.
+      - name: name
+        type: string
+        description: >
+          Human-readable unit name (e.g., "cup", "tablespoon", "oz", "slice",
+          "piece", "package").
+
+relationships:
+  - description: Each food belongs to one category.
+    cardinality: many-to-one
+    join: foods.food_category_id = food_categories.id
+  - description: Each food has one row per tracked nutrient.
+    cardinality: one-to-many
+    join: foods.fdc_id = food_nutrients.fdc_id
+  - description: Each nutrient type appears in many food measurements.
+    cardinality: one-to-many
+    join: nutrients.id = food_nutrients.nutrient_id
+  - description: Each food may have one or more common portion sizes.
+    cardinality: one-to-many
+    join: foods.fdc_id = food_portions.fdc_id
+  - description: Each portion references a measurement unit.
+    cardinality: many-to-one
+    join: food_portions.measure_unit_id = measure_units.id
+
+glossary:
+  per 100g: All nutrient amounts in food_nutrients are normalized to a 100-gram serving for fair comparison across foods.
+  fdc_id: USDA FoodData Central identifier — the primary key for food items in this dataset.
+  energy: Total caloric value, measured in kilocalories (kcal). Nutrient ID 1008.
+  macronutrient: One of the three main energy-providing nutrients — protein (ID 1003), fat (ID 1004), or carbohydrates (ID 1005).
+  nutrient IDs: >
+    Key nutrient IDs in this dataset:
+    1003 = Protein (G),
+    1004 = Total lipid / fat (G),
+    1005 = Carbohydrate by difference (G),
+    1008 = Energy (KCAL),
+    1063 = Sugars Total (G),
+    1079 = Fiber total dietary (G),
+    1258 = Fatty acids total saturated (G),
+    1087 = Calcium Ca (MG),
+    1089 = Iron Fe (MG),
+    1093 = Sodium Na (MG),
+    1162 = Vitamin C total ascorbic acid (MG),
+    1092 = Potassium K (MG).
+  gram_weight: The actual weight in grams of a described portion. Use this to convert per-100g nutrient values to per-serving values by multiplying by (gram_weight / 100).
diff --git a/pkg-r/inst/htmldep/querychat.js b/pkg-r/inst/htmldep/querychat.js
index 326b5e341..3045b2b8e 100644
--- a/pkg-r/inst/htmldep/querychat.js
+++ b/pkg-r/inst/htmldep/querychat.js
@@ -9,11 +9,11 @@
     if (!chatContainer) return;
 
     const chatId = chatContainer.id;
-    const { query, title } = event.target.dataset;
+    const { query, title, table } = event.target.dataset;
 
     window.Shiny.setInputValue(
       chatId + "_update",
-      { query, title },
+      { query, title, table },
       { priority: "event" }
     );
   });
diff --git a/pkg-r/inst/htmldep/schema-display.js b/pkg-r/inst/htmldep/schema-display.js
new file mode 100644
index 000000000..b21376c6c
--- /dev/null
+++ b/pkg-r/inst/htmldep/schema-display.js
@@ -0,0 +1,154 @@
+/* Generated file. Source: js/src/schema-display.js. Do not edit directly. */
+
+"use strict";
+(() => {
+  // src/schema-display.js
+  var lastDisplay = null; // most recent "Fetched schemas" <p> created by processCollector
+  var lastDisplayTime = 0; // Date.now() value recorded the last time a collector was processed
+  var BATCH_MS = 1e3; // a collector handled within this many ms of the previous one is appended to lastDisplay
+  var activePanel = null; // { btn, panel } of the currently open schema panel, or null when none is open
+  function parseColumnsJson(json) { // convert a JSON string holding an array of column records into display-ready objects
+    return JSON.parse(json).map((col) => ({ // JSON.parse errors are not caught here and propagate to the caller
+      name: col.name,
+      type: col.sql_type,
+      units: col.units || null, // any falsy value (missing, empty string) is normalised to null
+      description: col.description || null,
+      constraints: col.constraints && col.constraints.length > 0 ? col.constraints.join(", ") : null, // non-empty list joined with ", "
+      range: col.min_val != null && col.max_val != null ? `${col.min_val} to ${col.max_val}` : null, // only when both bounds are non-null
+      categories: col.categories && col.categories.length > 0 ? col.categories.map((v) => `'${v}'`).join(", ") : null // each value wrapped in single quotes
+    }));
+  }
+  function esc(s) { // coerce s to a string and escape &, <, > and " for insertion into HTML markup
+    return String(s).replace(/&/g, "&amp;").replace(/</g, "&lt;").replace(/>/g, "&gt;").replace(/"/g, "&quot;"); // & is replaced first so the entities produced by later steps are not re-escaped
+  }
+  var TH = "padding:0.35em 0.75em;text-align:left;white-space:nowrap;font-weight:600;border-bottom:2px solid var(--bs-border-color,#dee2e6);background:var(--bs-tertiary-bg,#f8f9fa);position:sticky;top:0;z-index:1;"; // inline style for header cells (sticky at the top of the scrolling panel)
+  var TD_MONO = "padding:0.3em 0.75em;white-space:nowrap;font-family:var(--bs-font-monospace,monospace);font-size:0.875em;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));"; // inline style for the column-name and type cells
+  var TD_WRAP = "padding:0.3em 0.75em;max-width:22em;overflow-wrap:break-word;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));"; // inline style for the description and range/values cells (wraps, capped at 22em)
+  var TD_NOWRAP = "padding:0.3em 0.75em;white-space:nowrap;border-bottom:1px solid var(--bs-border-color-translucent,rgba(0,0,0,.08));"; // inline style for the constraints cell
+  function renderTable(columns) { // build the schema <table> markup (as a string) from objects shaped like parseColumnsJson output
+    const rows = columns.map((col) => { // one <tr> per column; every interpolated value goes through esc()
+      let typeCell = esc(col.type);
+      if (col.units) {
+        typeCell += ` <span style="color:var(--bs-secondary-color,#6c757d)">[${esc(col.units)}]</span>`; // units shown in brackets after the type
+      }
+      const details = col.range ? esc(col.range) : col.categories ? esc(col.categories) : ""; // range takes precedence over categories
+      return `<tr><td style="${TD_MONO}">${esc(col.name)}</td><td style="${TD_MONO}">${typeCell}</td><td style="${TD_WRAP}">${col.description ? esc(col.description) : ""}</td><td style="${TD_NOWRAP}">${col.constraints ? esc(col.constraints) : ""}</td><td style="${TD_WRAP}">${details}</td></tr>`;
+    }).join("");
+    return `<table style="border-collapse:collapse;min-width:100%;width:max-content;font-size:0.875em;"><thead><tr><th style="${TH}">Column</th><th style="${TH}">Type</th><th style="${TH}">Description</th><th style="${TH}">Constraints</th><th style="${TH}">Range / Values</th></tr></thead><tbody>${rows}</tbody></table>`;
+  }
+  var PANEL_STYLE = "position:fixed;z-index:9999;background:var(--bs-body-bg,#fff);color:var(--bs-body-color,#212529);border:1px solid var(--bs-border-color,#dee2e6);border-radius:var(--bs-border-radius,0.375rem);box-shadow:0 4px 16px rgba(0,0,0,.15);overflow:auto;max-height:min(420px,60vh);"; // inline style for the floating schema panel: fixed-position, scrollable, height capped at min(420px, 60vh)
+  function positionPanel(btn, panel) { // set panel width/left/top (viewport coordinates) so it opens next to btn
+    const rect = btn.getBoundingClientRect();
+    const vw = window.innerWidth;
+    const vh = window.innerHeight;
+    const pw = Math.min(Math.max(360, vw * 0.55), vw - 16); // 55% of the viewport, at least 360px, never wider than viewport minus 16px
+    panel.style.width = `${pw}px`;
+    panel.style.left = `${Math.max(8, Math.min(rect.left, vw - pw - 8))}px`; // align with the button but keep 8px from either viewport edge
+    const spaceBelow = vh - rect.bottom - 8;
+    const spaceAbove = rect.top - 8;
+    if (spaceBelow >= 120 || spaceBelow >= spaceAbove) { // open below when there is at least 120px, or at least as much room as above
+      panel.style.top = `${rect.bottom + 4}px`;
+    } else { // otherwise open above the button
+      const panelH = Math.min(420, spaceAbove); // NOTE(review): an estimate, not the measured height; a shorter panel (or the 60vh cap in PANEL_STYLE) leaves a gap above the button
+      panel.style.top = `${Math.max(8, rect.top - panelH - 4)}px`;
+    }
+  }
+  function closePanel() { // hide the open panel, if any, and reset its button state; does nothing when no panel is open
+    if (activePanel) {
+      activePanel.panel.hidden = true;
+      activePanel.btn.setAttribute("aria-expanded", "false");
+      activePanel = null;
+    }
+  }
+  document.addEventListener("click", closePanel); // any click reaching document closes the panel; button and panel clicks stop propagation in createBtn
+  document.addEventListener("keydown", (e) => {
+    if (e.key === "Escape") closePanel();
+  });
+  window.addEventListener(
+    "scroll",
+    (e) => {
+      if (activePanel && !activePanel.panel.contains( // scrolling inside the panel itself must not close it
+        /** @type {Node} */
+        e.target
+      )) {
+        closePanel();
+      }
+    },
+    true // listen in the capture phase
+  );
+  window.addEventListener("resize", closePanel); // position is only computed on open, so close rather than reposition
+  function createBtn(tableName, columnsJson) { // create a toggle button for tableName plus its hidden schema panel; returns the button
+    const columns = parseColumnsJson(columnsJson); // throws if columnsJson is not valid JSON
+    const btn = document.createElement("button");
+    btn.type = "button";
+    btn.style.cssText = "background:none;border:none;padding:0;color:inherit;text-decoration:underline dotted;cursor:pointer;font-size:inherit;border-radius:2px;";
+    btn.textContent = tableName;
+    btn.setAttribute("aria-label", `Show schema for ${tableName}`);
+    btn.setAttribute("aria-expanded", "false");
+    btn.setAttribute("aria-haspopup", "dialog");
+    const panel = document.createElement("div");
+    panel.setAttribute("role", "dialog");
+    panel.setAttribute("aria-label", `${tableName} schema`);
+    panel.style.cssText = PANEL_STYLE;
+    panel.hidden = true;
+    panel.innerHTML = renderTable(columns); // renderTable escapes every column value before interpolating it
+    document.body.appendChild(panel); // NOTE(review): nothing in this file removes the panel from document.body again
+    btn.addEventListener("click", (e) => {
+      e.stopPropagation(); // keep the document-level click listener from closing the panel straight away
+      if (activePanel && activePanel.panel === panel) { // second click on the same button toggles the panel closed
+        closePanel();
+        return;
+      }
+      closePanel(); // only one panel is open at a time
+      positionPanel(btn, panel);
+      panel.hidden = false;
+      btn.setAttribute("aria-expanded", "true");
+      activePanel = { btn, panel };
+    });
+    panel.addEventListener("click", (e) => e.stopPropagation()); // clicks inside the panel do not dismiss it
+    return btn;
+  }
+  var style = document.createElement("style"); // stylesheet for the :focus-visible outline on schema buttons
+  style.textContent = ".qc-schema-display button:focus-visible{outline:2px solid currentColor;outline-offset:2px;border-radius:2px}";
+  document.head.appendChild(style); // injected once, when the script loads
+  function processCollector(sentinel) { // turn a .qc-schema-collector element into a schema button, batching with the previous display when recent
+    const now = Date.now();
+    const tableName = sentinel.dataset.table; // read from the data-table attribute
+    const btn = createBtn(tableName, sentinel.dataset.schemaJson); // read from the data-schema-json attribute
+    if (lastDisplay && document.contains(lastDisplay) && now - lastDisplayTime < BATCH_MS) { // previous display is still in the DOM and was updated less than BATCH_MS ago
+      lastDisplay.appendChild(document.createTextNode(", "));
+      lastDisplay.appendChild(btn);
+      sentinel.remove(); // the button now lives in the earlier display, so drop the sentinel
+    } else { // otherwise start a new "Fetched schemas" line in place of the sentinel
+      const p = document.createElement("p");
+      p.className = "qc-schema-display";
+      p.style.cssText = "color:var(--bs-secondary-color,#6c757d);font-size:0.875em;margin:0.1rem 0;";
+      p.appendChild(document.createTextNode("\u{1F50D} Fetched schemas: "));
+      p.appendChild(btn);
+      sentinel.replaceWith(p);
+      lastDisplay = p;
+    }
+    lastDisplayTime = now; // updated on both paths, so the batching window is measured from the latest collector
+  }
+  new MutationObserver((mutations) => { // process every .qc-schema-collector element added anywhere under document.body
+    for (const { addedNodes } of mutations) {
+      for (const node of addedNodes) {
+        if (node.nodeType !== 1) continue; // skip non-element nodes (nodeType 1 is an element)
+        if (
+          /** @type {Element} */
+          node.classList.contains("qc-schema-collector")
+        ) {
+          processCollector(
+            /** @type {HTMLElement} */
+            node
+          );
+        } else { // the added element is not a collector itself, so look for collectors among its descendants
+          node.querySelectorAll(".qc-schema-collector").forEach((el) => processCollector(
+            /** @type {HTMLElement} */
+            el
+          ));
+        }
+      }
+    }
+  }).observe(document.body, { subtree: true, childList: true });
+})();
diff --git a/pkg-r/inst/prompts/prompt.md b/pkg-r/inst/prompts/prompt.md
index 93bd100d9..adbbe3c4c 100644
--- a/pkg-r/inst/prompts/prompt.md
+++ b/pkg-r/inst/prompts/prompt.md
@@ -1,20 +1,26 @@
 You are a data dashboard chatbot that operates in a sidebar interface. Your role is to help users interact with their data through filtering, sorting, and answering questions.{{#has_tool_visualize}} You can also help them explore data visually.{{/has_tool_visualize}}
 
-You have access to a {{db_type}} SQL database with the following schema:
+You have access to a {{db_type}} SQL database with the following tables:
 
-<database_schema>
-{{schema}}
-</database_schema>
+{{#has_data_dicts}}
+{{{data_dicts}}}
 
-{{#data_description}}
-Here is additional information about the data:
+{{/has_data_dicts}}
+{{^has_data_dicts}}
+<tables>
+{{{tables_overview}}}
+</tables>
 
+{{/has_data_dicts}}
+{{#data_description}}
 <data_description>
 {{data_description}}
 </data_description>
+
 {{/data_description}}
+Always call `querychat_get_schema` before writing SQL against any table whose schema you have not already retrieved in this conversation. Do not infer column names from table names, variable names, or the system prompt alone — verify the actual schema first, then write the query.
 
-For security reasons, you may only query this specific table.
+For security reasons, you may only query {{#multi_table}}these specific tables{{/multi_table}}{{^multi_table}}this specific table{{/multi_table}}.
 
 {{#include_query_guidelines}}
 ## SQL Query Guidelines
@@ -82,18 +88,19 @@ You can handle these types of requests:
 When the user asks you to filter or sort the dashboard, e.g. "Show me..." or "Which ____ have the highest ____?" or "Filter to only include ____":
 
 - Write a {{db_type}} SQL SELECT query
-- Call `querychat_update_dashboard` with the query and a descriptive title
-- The query MUST return all columns from the schema (you can use `SELECT *`)
+- Call `querychat_update_dashboard` with the query, table name, and a descriptive title
+- You MUST specify the `table` parameter to indicate which table to filter
+- The query MUST return all columns from the specified table's schema (you can use `SELECT *`)
 - Use a single SQL query even if complex (subqueries and CTEs are fine)
 - Optimize for **readability over efficiency**
 - Include SQL comments to explain complex logic
 - No confirmation messages are needed: the user will see your query in the dashboard.
 
-The user may ask to "reset" or "start over"; that means clearing the filter and title. Do this by calling `querychat_reset_dashboard()`.
+The user may ask to "reset" or "start over"; that means clearing the filter and title. Do this by calling `querychat_reset_dashboard` with the relevant `table`.
 
 **Filtering Example:**
 User: "Show only rows where sales are above average"
-Tool Call: `querychat_update_dashboard({query: "SELECT * FROM table WHERE sales > (SELECT AVG(sales) FROM table)", title: "Above average sales"})`
+Tool Call: `querychat_update_dashboard({query: "SELECT * FROM sales_data WHERE sales > (SELECT AVG(sales) FROM sales_data)", table: "sales_data", title: "Above average sales"})`
 Response: ""
 
 No further response needed, the user will see the updated dashboard.
@@ -107,6 +114,9 @@ When the user asks you a question about the data, e.g. "What is the average ____
 - Use the `querychat_query` tool to run SQL queries
 - Always use SQL for calculations (counting, averaging, etc.) - NEVER do manual calculations
 - Always present key findings in your response text — do not assume the user can see the tool result (it may be collapsed)
+- If you are unsure whether to set `collapsed`, omit it and use the tool default behavior
+- If you set `collapsed` explicitly, prefer `collapsed=true`; use `collapsed=false` only when the user explicitly asks to see the raw table immediately
+- If you use `collapsed=false`, avoid repeating the same table rows/values in your response text
 - If you cannot complete the request using SQL, politely decline and explain why
 
 **Question Example:**
@@ -122,7 +132,7 @@ You can create visualizations using the `querychat_visualize` tool, which uses g
 
 #### Visualization best practices
 
-The database schema in this prompt includes column names, types, and summary statistics. {{#has_tool_query}}If that context isn't sufficient for a confident visualization — e.g., you're unsure about value distributions, need to check for NULLs, or want to gauge row counts before choosing a chart type — use the `querychat_query` tool to inspect the data before visualizing. Always pass `collapsed=true` for these preparatory queries so the chart remains the focal point of the response.{{/has_tool_query}}
+Use the `querychat_get_schema` tool to retrieve column names, types, and summary statistics for a table before writing visualization queries. {{#has_tool_query}}If that context isn't sufficient for a confident visualization — e.g., you're unsure about value distributions, need to check for NULLs, or want to gauge row counts before choosing a chart type — use the `querychat_query` tool to inspect the data before visualizing. Always pass `collapsed=true` for these preparatory queries so the chart remains the focal point of the response.{{/has_tool_query}}
 
 Follow the principles below to produce clear, interpretable charts.
 
diff --git a/pkg-r/inst/prompts/tool-get-schema.md b/pkg-r/inst/prompts/tool-get-schema.md
new file mode 100644
index 000000000..5447d99b4
--- /dev/null
+++ b/pkg-r/inst/prompts/tool-get-schema.md
@@ -0,0 +1,8 @@
+Retrieve full column details for a table
+
+Returns column names, types, value ranges, categorical values, and descriptions for the specified table.
+
+**When to use this tool:**
+
+- Before writing any SQL query involving a table you have not yet inspected
+- When you are unsure which table is most relevant to the user's request — call this tool on candidate tables to understand their contents before deciding
diff --git a/pkg-r/inst/prompts/tool-query.md b/pkg-r/inst/prompts/tool-query.md
index caa5bb286..b5044ae43 100644
--- a/pkg-r/inst/prompts/tool-query.md
+++ b/pkg-r/inst/prompts/tool-query.md
@@ -19,5 +19,14 @@ Always use SQL for counting, averaging, summing, and other calculations—NEVER
 - Optimize for readability over efficiency—use clear column aliases and SQL comments to explain complex logic
 - Subqueries and CTEs are acceptable and encouraged for complex calculations
 - After receiving results, always present the key findings in your response text — the tool result starts collapsed by default, so don't assume the user has seen the raw data
-- When the result is a single value or small summary, state it directly in prose. When the result is a table that IS the answer, either use a Markdown table in your response or set `collapsed` to `false` — not both
+- If you are unsure whether to control visibility, omit `collapsed` and rely on the tool default behavior
+- If you set `collapsed` explicitly, prefer `collapsed=true`
+- Use `collapsed=false` only when the user explicitly wants the raw table visible immediately (for example, "show me the rows/table")
+- When using `collapsed=false`, avoid duplicating the same rows/values in both the tool result and your response text
 - Do not reproduce large result sets in your response — summarize the key takeaways instead
+
+{{#multi_table}}
+
+**Multi-table queries:** Your schema includes multiple tables. You can reference any table in your queries and use JOINs when the data spans tables. Use the relationships described in the schema to determine join conditions.
+
+{{/multi_table}}
diff --git a/pkg-r/inst/prompts/tool-reset-dashboard.md b/pkg-r/inst/prompts/tool-reset-dashboard.md
index 6aec33464..75f741423 100644
--- a/pkg-r/inst/prompts/tool-reset-dashboard.md
+++ b/pkg-r/inst/prompts/tool-reset-dashboard.md
@@ -2,6 +2,6 @@ Reset the dashboard to its original state
 
 Resets the dashboard to use the original unfiltered dataset and clears any custom title.
 
-If the user asks to reset the dashboard, simply call this tool with no other response. The reset action will be obvious to the user.
+If the user asks to reset the dashboard, call this tool with the relevant table name and no other response. The reset action will be obvious to the user.
 
-If the user asks to start over, call this tool and then provide a new set of suggestions for next steps. Include suggestions that encourage exploration of the data in new directions.
+If the user asks to start over, call this tool with the relevant table name and then provide a new set of suggestions for next steps. Include suggestions that encourage exploration of the data in new directions.
diff --git a/pkg-r/inst/prompts/tool-update-dashboard.md b/pkg-r/inst/prompts/tool-update-dashboard.md
index 96f6ccce5..e0dd35191 100644
--- a/pkg-r/inst/prompts/tool-update-dashboard.md
+++ b/pkg-r/inst/prompts/tool-update-dashboard.md
@@ -1,8 +1,8 @@
 Filter and sort the dashboard data
 
-This tool executes a {{db_type}} SQL SELECT `query` to filter or sort the data used in the dashboard.
+This tool executes a {{db_type}} SQL SELECT query to filter or sort the data used in the dashboard.
 
-**Returns:** A confirmation that the dashboard was updated successfully, or the error that occurred when running the SQL query. The results of the query will update the data shown in the dashboard.
+The `table` parameter specifies which table to filter. Use the table name exactly as shown in the schema.
 
 **When to use:** Call this tool whenever the user requests filtering, sorting, or data manipulation on the dashboard with questions like "Show me..." or "Which records have...". This tool is appropriate for any request that involves showing a subset of the data or reordering it.
 
@@ -15,3 +15,9 @@ This tool executes a {{db_type}} SQL SELECT `query` to filter or sort the data u
 - For statistical filters (stddev, percentiles), use CTEs to calculate thresholds within the query
 - Assume the user will only see the original columns in the dataset
 
+
+{{#multi_table}}
+
+**Multi-table filters:** When filtering a table, you may reference other tables in WHERE clauses, subqueries, or CTEs (e.g., filtering orders by a condition on customers). The result must still return all columns of the target table specified by the `table` parameter.
+
+{{/multi_table}}
diff --git a/pkg-r/inst/prompts/tool-visualize.md b/pkg-r/inst/prompts/tool-visualize.md
index 25680e674..f7b1daf9b 100644
--- a/pkg-r/inst/prompts/tool-visualize.md
+++ b/pkg-r/inst/prompts/tool-visualize.md
@@ -9,3 +9,9 @@ Render a ggsql query (SQL with a VISUALISE clause) as an interactive chart displ
 - All data transformations must happen in the `SELECT` clause. `VISUALISE` and `MAPPING` accept column names only, not SQL expressions or functions.
 - Do NOT include `LABEL title => ...` in the query — use the `title` parameter instead.
 - If a visualization fails, read the error message carefully and retry with a corrected query. Common fixes: correcting column names, adding `SCALE DISCRETE` for integer categories, moving SQL expressions out of `VISUALISE` into the `SELECT` clause, and using `DRAW range` for interval-style marks instead of deprecated `errorbar`.{{#has_tool_query}} If the error persists, fall back to `querychat_query` for a tabular answer.{{/has_tool_query}}
+
+{{#multi_table}}
+
+**Multi-table queries:** The SELECT portion of your ggsql query can reference any table from the schema and use JOINs.
+
+{{/multi_table}}
diff --git a/pkg-r/man/DBISource.Rd b/pkg-r/man/DBISource.Rd
index 86a10b68f..539af25a8 100644
--- a/pkg-r/man/DBISource.Rd
+++ b/pkg-r/man/DBISource.Rd
@@ -37,6 +37,7 @@ db_source$cleanup()
     \item \href{#method-DBISource-initialize}{\code{DBISource$new()}}
     \item \href{#method-DBISource-get_db_type}{\code{DBISource$get_db_type()}}
     \item \href{#method-DBISource-get_schema}{\code{DBISource$get_schema()}}
+    \item \href{#method-DBISource-get_schema_result}{\code{DBISource$get_schema_result()}}
     \item \href{#method-DBISource-get_semantic_views_description}{\code{DBISource$get_semantic_views_description()}}
     \item \href{#method-DBISource-execute_query}{\code{DBISource$execute_query()}}
     \item \href{#method-DBISource-test_query}{\code{DBISource$test_query()}}
@@ -96,7 +97,7 @@ string or a \code{\link[DBI:Id]{DBI::Id()}} object for tables in catalogs/schema
   Get schema information for the database table
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
-    \preformatted{DBISource$get_schema(categorical_threshold = 20)}
+    \preformatted{DBISource$get_schema(categorical_threshold = 20, table_spec = NULL)}
     \if{html}{\out{</div>}}
   }
   \subsection{Arguments}{
@@ -112,6 +113,17 @@ column to be considered categorical (default: 20)}
   }
 }
 
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-DBISource-get_schema_result"></a>}}
+\if{latex}{\out{\hypertarget{method-DBISource-get_schema_result}{}}}
+\subsection{\code{DBISource$get_schema_result()}}{
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{DBISource$get_schema_result(categorical_threshold = 20, table_spec = NULL)}
+    \if{html}{\out{</div>}}
+  }
+}
+
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-DBISource-get_semantic_views_description"></a>}}
 \if{latex}{\out{\hypertarget{method-DBISource-get_semantic_views_description}{}}}
diff --git a/pkg-r/man/DataFrameSource.Rd b/pkg-r/man/DataFrameSource.Rd
index 0ceb00e3e..b7402f4fa 100644
--- a/pkg-r/man/DataFrameSource.Rd
+++ b/pkg-r/man/DataFrameSource.Rd
@@ -45,17 +45,18 @@ df_sqlite$cleanup()
 \subsection{Public methods}{
   \itemize{
     \item \href{#method-DataFrameSource-initialize}{\code{DataFrameSource$new()}}
+    \item \href{#method-DataFrameSource-cleanup}{\code{DataFrameSource$cleanup()}}
     \item \href{#method-DataFrameSource-clone}{\code{DataFrameSource$clone()}}
   }
 }
 \if{html}{\out{<details><summary>Inherited methods</summary>
 <ul>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DataSource" data-id="get_data_description"><a href='../../querychat/html/DataSource.html#method-DataSource-get_data_description'><code>DataSource$get_data_description()</code></a></span></li>
-  <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="cleanup"><a href='../../querychat/html/DBISource.html#method-DBISource-cleanup'><code>DBISource$cleanup()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="execute_query"><a href='../../querychat/html/DBISource.html#method-DBISource-execute_query'><code>DBISource$execute_query()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_data"><a href='../../querychat/html/DBISource.html#method-DBISource-get_data'><code>DBISource$get_data()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_db_type"><a href='../../querychat/html/DBISource.html#method-DBISource-get_db_type'><code>DBISource$get_db_type()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_schema"><a href='../../querychat/html/DBISource.html#method-DBISource-get_schema'><code>DBISource$get_schema()</code></a></span></li>
+  <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_schema_result"><a href='../../querychat/html/DBISource.html#method-DBISource-get_schema_result'><code>DBISource$get_schema_result()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_semantic_views_description"><a href='../../querychat/html/DBISource.html#method-DBISource-get_semantic_views_description'><code>DBISource$get_semantic_views_description()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="test_query"><a href='../../querychat/html/DBISource.html#method-DBISource-test_query'><code>DBISource$test_query()</code></a></span></li>
 </ul>
@@ -93,6 +94,21 @@ engine from duckdb or RSQLite (in that order).}
   }
 }
 
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-DataFrameSource-cleanup"></a>}}
+\if{latex}{\out{\hypertarget{method-DataFrameSource-cleanup}{}}}
+\subsection{\code{DataFrameSource$cleanup()}}{
+  Disconnect from the database and shut down the DuckDB instance if used.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{DataFrameSource$cleanup()}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Returns}{
+    NULL (invisibly)
+  }
+}
+
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-DataFrameSource-clone"></a>}}
 \if{latex}{\out{\hypertarget{method-DataFrameSource-clone}{}}}
diff --git a/pkg-r/man/DataSource.Rd b/pkg-r/man/DataSource.Rd
index 70ea602af..5ecd8ceee 100644
--- a/pkg-r/man/DataSource.Rd
+++ b/pkg-r/man/DataSource.Rd
@@ -34,6 +34,7 @@ MyDataSource <- R6::R6Class(
   \itemize{
     \item \href{#method-DataSource-get_db_type}{\code{DataSource$get_db_type()}}
     \item \href{#method-DataSource-get_schema}{\code{DataSource$get_schema()}}
+    \item \href{#method-DataSource-get_schema_result}{\code{DataSource$get_schema_result()}}
     \item \href{#method-DataSource-execute_query}{\code{DataSource$execute_query()}}
     \item \href{#method-DataSource-test_query}{\code{DataSource$test_query()}}
     \item \href{#method-DataSource-get_data}{\code{DataSource$get_data()}}
@@ -64,7 +65,7 @@ MyDataSource <- R6::R6Class(
   Get schema information about the table
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
-    \preformatted{DataSource$get_schema(categorical_threshold = 20)}
+    \preformatted{DataSource$get_schema(categorical_threshold = 20, table_spec = NULL)}
     \if{html}{\out{</div>}}
   }
   \subsection{Arguments}{
@@ -80,6 +81,17 @@ column to be considered categorical}
   }
 }
 
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-DataSource-get_schema_result"></a>}}
+\if{latex}{\out{\hypertarget{method-DataSource-get_schema_result}{}}}
+\subsection{\code{DataSource$get_schema_result()}}{
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{DataSource$get_schema_result(categorical_threshold = 20, table_spec = NULL)}
+    \if{html}{\out{</div>}}
+  }
+}
+
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-DataSource-execute_query"></a>}}
 \if{latex}{\out{\hypertarget{method-DataSource-execute_query}{}}}
diff --git a/pkg-r/man/PinSource.Rd b/pkg-r/man/PinSource.Rd
index 598912f41..34eacf4a9 100644
--- a/pkg-r/man/PinSource.Rd
+++ b/pkg-r/man/PinSource.Rd
@@ -77,6 +77,7 @@ if (rlang::is_installed(c("pins", "duckdb"))) {
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_data"><a href='../../querychat/html/DBISource.html#method-DBISource-get_data'><code>DBISource$get_data()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_db_type"><a href='../../querychat/html/DBISource.html#method-DBISource-get_db_type'><code>DBISource$get_db_type()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_schema"><a href='../../querychat/html/DBISource.html#method-DBISource-get_schema'><code>DBISource$get_schema()</code></a></span></li>
+  <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_schema_result"><a href='../../querychat/html/DBISource.html#method-DBISource-get_schema_result'><code>DBISource$get_schema_result()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="get_semantic_views_description"><a href='../../querychat/html/DBISource.html#method-DBISource-get_semantic_views_description'><code>DBISource$get_semantic_views_description()</code></a></span></li>
   <li><span class="pkg-link" data-pkg="querychat" data-topic="DBISource" data-id="test_query"><a href='../../querychat/html/DBISource.html#method-DBISource-test_query'><code>DBISource$test_query()</code></a></span></li>
 </ul>
diff --git a/pkg-r/man/QueryChat.Rd b/pkg-r/man/QueryChat.Rd
index 24988177f..c6f759ded 100644
--- a/pkg-r/man/QueryChat.Rd
+++ b/pkg-r/man/QueryChat.Rd
@@ -18,7 +18,7 @@ as input and provides methods to:
 \item Initialize server logic that returns session-specific reactive values (via
 \verb{$server()})
 \item Access reactive data, SQL queries, and titles through the returned server
-values
+values (use \code{qc_vals$table("name")} for multi-table access)
 }
 }
 \section{Usage in Shiny Apps}{
@@ -100,6 +100,8 @@ qc <- QueryChat$new(con, "mtcars")
 
     \item{\code{id}}{ID for the QueryChat instance.}
 
+    \item{\code{id_override}}{Whether the ID was explicitly set by the user.}
+
     \item{\code{tools}}{The allowed tools for the chat client.}
   }
   \if{html}{\out{</div>}}
@@ -109,8 +111,7 @@ qc <- QueryChat$new(con, "mtcars")
   \describe{
     \item{\code{system_prompt}}{Get the system prompt.}
 
-    \item{\code{data_source}}{Get or set the current data source. When setting,
-the value is normalized and the system prompt is rebuilt.}
+    \item{\code{data_source}}{Removed. Use \verb{$add_table()} and \verb{$remove_table()} to manage tables.}
   }
   \if{html}{\out{</div>}}
 }
@@ -118,6 +119,10 @@ the value is normalized and the system prompt is rebuilt.}
 \subsection{Public methods}{
   \itemize{
     \item \href{#method-QueryChat-initialize}{\code{QueryChat$new()}}
+    \item \href{#method-QueryChat-add_table}{\code{QueryChat$add_table()}}
+    \item \href{#method-QueryChat-add_tables}{\code{QueryChat$add_tables()}}
+    \item \href{#method-QueryChat-remove_table}{\code{QueryChat$remove_table()}}
+    \item \href{#method-QueryChat-table_names}{\code{QueryChat$table_names()}}
     \item \href{#method-QueryChat-client}{\code{QueryChat$client()}}
     \item \href{#method-QueryChat-console}{\code{QueryChat$console()}}
     \item \href{#method-QueryChat-app}{\code{QueryChat$app()}}
@@ -149,6 +154,7 @@ the value is normalized and the system prompt is rebuilt.}
   categorical_threshold = 20,
   extra_instructions = NULL,
   prompt_template = NULL,
+  data_dict = NULL,
   cleanup = NA
 )}
     \if{html}{\out{</div>}}
@@ -158,8 +164,8 @@ the value is normalized and the system prompt is rebuilt.}
     \describe{
       \item{\code{data_source}}{Either a data.frame, a database connection (e.g., DBI
 connection), or \code{NULL} to defer setting the data source until later.
-When \code{NULL}, the data source must be set via the \verb{$data_source} property
-or passed to \verb{$server()} before calling methods that require data access.}
+When \code{NULL}, the data source must be added via \verb{$add_table()} or passed
+to \verb{$server()} before calling methods that require data access.}
       \item{\code{table_name}}{A string specifying the table name to use in SQL
 queries. If \code{data_source} is a data.frame, this is the name to refer to
 it by in queries (typically the variable name). If not provided, will
@@ -200,6 +206,8 @@ model in plain text or Markdown. Can be a string or a file path.}
 template file. If not provided, the default querychat template will be
 used. See the package prompts directory for the default template
 format.}
+      \item{\code{data_dict}}{Optional data dictionary. A path to a YAML file, or a
+list of YAML file paths. See \code{\link[=read_data_dict]{read_data_dict()}} for the expected format.}
       \item{\code{cleanup}}{Whether or not to automatically run \verb{$cleanup()} when the
 Shiny session/app stops. By default, cleanup only occurs if \code{QueryChat}
 gets created within a Shiny session. Set to \code{TRUE} to always clean up,
@@ -212,6 +220,96 @@ or \code{FALSE} to never clean up automatically.}
   }
 }
 
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-QueryChat-add_table"></a>}}
+\if{latex}{\out{\hypertarget{method-QueryChat-add_table}{}}}
+\subsection{\code{QueryChat$add_table()}}{
+  Add a table to this QueryChat instance.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{QueryChat$add_table(data_source, table_name, replace = FALSE)}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Arguments}{
+    \if{html}{\out{<div class="arguments">}}
+    \describe{
+      \item{\code{data_source}}{A data frame, database connection, or DataSource object.}
+      \item{\code{table_name}}{The SQL table name for this data source.}
+      \item{\code{replace}}{Whether to replace an existing table with this name.
+Default is \code{FALSE}.}
+    }
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Returns}{
+    Invisibly returns \code{self} for chaining.
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-QueryChat-add_tables"></a>}}
+\if{latex}{\out{\hypertarget{method-QueryChat-add_tables}{}}}
+\subsection{\code{QueryChat$add_tables()}}{
+  Add multiple tables from a DBI connection in a single call.
+
+Unlike calling \verb{$add_table()} repeatedly, this method builds the
+system prompt exactly once after all tables have been staged, avoiding
+the N-1 redundant intermediate rebuilds that adding N tables one at a time would trigger.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{QueryChat$add_tables(conn, tables = NULL, replace = FALSE)}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Arguments}{
+    \if{html}{\out{<div class="arguments">}}
+    \describe{
+      \item{\code{conn}}{A DBI connection. Only DBI connections are supported; pass
+individual data frames or other sources via \verb{$add_table()}.}
+      \item{\code{tables}}{Table names to register. When \code{NULL}, all tables returned
+by \code{DBI::dbListTables(conn)} are used.}
+      \item{\code{replace}}{Whether to replace existing tables with the same name.
+Default is \code{FALSE}.}
+    }
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Returns}{
+    Invisibly returns \code{self} for chaining.
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-QueryChat-remove_table"></a>}}
+\if{latex}{\out{\hypertarget{method-QueryChat-remove_table}{}}}
+\subsection{\code{QueryChat$remove_table()}}{
+  Remove a table from this QueryChat instance.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{QueryChat$remove_table(table_name)}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Arguments}{
+    \if{html}{\out{<div class="arguments">}}
+    \describe{
+      \item{\code{table_name}}{The name of the table to remove.}
+    }
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Returns}{
+    Invisibly returns \code{self} for chaining.
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-QueryChat-table_names"></a>}}
+\if{latex}{\out{\hypertarget{method-QueryChat-table_names}{}}}
+\subsection{\code{QueryChat$table_names()}}{
+  Return the names of all registered tables.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{QueryChat$table_names()}
+    \if{html}{\out{</div>}}
+  }
+}
+
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-QueryChat-client"></a>}}
 \if{latex}{\out{\hypertarget{method-QueryChat-client}{}}}
@@ -222,9 +320,9 @@ data source.
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$client(
   tools = NA,
-  update_dashboard = function(query, title) {
+  update_dashboard = function(query, title, table) {
  },
-  reset_dashboard = function() {
+  reset_dashboard = function(table) {
  },
   visualize = function(data) {
  },
@@ -240,10 +338,10 @@ data source.
 and \code{"query"} includes the tool for executing SQL queries. By default,
 when \code{tools = NA}, the values provided at initialization are used.
 The legacy name \code{"update"} is still accepted as an alias for \code{"filter"}.}
-      \item{\code{update_dashboard}}{Optional function to call with the \code{query} and
-\code{title} generated by the LLM for the \code{update_dashboard} tool.}
+      \item{\code{update_dashboard}}{Optional function to call with the \code{query},
+\code{title}, and \code{table} generated by the LLM for the \code{update_dashboard} tool.}
       \item{\code{reset_dashboard}}{Optional function to call when the
-\code{reset_dashboard} tool is called.}
+\code{reset_dashboard} tool is called. The function takes a \code{table} argument.}
       \item{\code{visualize}}{Optional function to call with a list containing
 \code{ggsql}, \code{title}, and \code{widget_id} when a visualization succeeds.}
       \item{\code{session}}{A Shiny session object. Required when \code{"visualize"} is
@@ -285,17 +383,6 @@ By default, only the \code{"query"} tool is included, regardless of the
 \if{latex}{\out{\hypertarget{method-QueryChat-app}{}}}
 \subsection{\code{QueryChat$app()}}{
   Create and run a Shiny gadget for chatting with data
-
-Runs a Shiny gadget (designed for interactive use) that provides a
-complete interface for chatting with your data using natural language. If
-you're looking to deploy this app or run it through some other means, see
-\verb{$app_obj()}.
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{library(querychat)
-
-qc <- QueryChat$new(mtcars)
-qc$app()
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$app(..., bookmark_store = "url")}
@@ -312,13 +399,7 @@ qc$app()
     \if{html}{\out{</div>}}
   }
   \subsection{Returns}{
-    Invisibly returns a list of session-specific values:
-\itemize{
-\item \code{df}: The final filtered data frame
-\item \code{sql}: The final SQL query string
-\item \code{title}: The final title
-\item \code{client}: The session-specific chat client instance
-}
+    Invisibly returns a list of session-specific values.
   }
 }
 
@@ -327,21 +408,6 @@ qc$app()
 \if{latex}{\out{\hypertarget{method-QueryChat-app_obj}{}}}
 \subsection{\code{QueryChat$app_obj()}}{
   A streamlined Shiny app for chatting with data
-
-Creates a Shiny app designed for chatting with data, with:
-\itemize{
-\item A sidebar containing the chat interface
-\item A card displaying the current SQL query
-\item A card displaying the filtered data table
-\item A reset button to clear the query
-}
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{library(querychat)
-
-qc <- QueryChat$new(mtcars)
-app <- qc$app_obj()
-shiny::runApp(app)
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$app_obj(..., bookmark_store = "url")}
@@ -352,8 +418,7 @@ shiny::runApp(app)
     \describe{
       \item{\code{...}}{Additional arguments (currently unused).}
       \item{\code{bookmark_store}}{The bookmarking storage method. Passed to
-\code{\link[shiny:enableBookmarking]{shiny::enableBookmarking()}}. If \code{"url"} or \code{"server"}, the chat state
-(including current query) will be bookmarked. Default is \code{"url"}.}
+\code{\link[shiny:enableBookmarking]{shiny::enableBookmarking()}}. Default is \code{"url"}.}
     }
     \if{html}{\out{</div>}}
   }
@@ -367,18 +432,6 @@ shiny::runApp(app)
 \if{latex}{\out{\hypertarget{method-QueryChat-sidebar}{}}}
 \subsection{\code{QueryChat$sidebar()}}{
   Create a sidebar containing the querychat UI.
-
-This method generates a \code{\link[bslib:sidebar]{bslib::sidebar()}} component containing the chat
-interface, suitable for use with \code{\link[bslib:page_sidebar]{bslib::page_sidebar()}} or similar
-layouts.
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{qc <- QueryChat$new(mtcars)
-
-ui <- page_sidebar(
-  qc$sidebar(),
-  # Main content here
-)
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$sidebar(
@@ -398,10 +451,7 @@ ui <- page_sidebar(
       \item{\code{height}}{Height of the sidebar. Default is "100\%".}
       \item{\code{fillable}}{Whether the sidebar should be fillable. Default is
 \code{TRUE}.}
-      \item{\code{id}}{Optional ID for the QueryChat instance. If not provided, will
-use the ID provided at initialization. If using \verb{$sidebar()} in a Shiny
-module, you'll need to provide \code{id = ns("your_id")} where \code{ns} is the
-namespacing function from \code{\link[shiny:NS]{shiny::NS()}}.}
+      \item{\code{id}}{Optional ID for the QueryChat instance.}
     }
     \if{html}{\out{</div>}}
   }
@@ -415,16 +465,6 @@ namespacing function from \code{\link[shiny:NS]{shiny::NS()}}.}
 \if{latex}{\out{\hypertarget{method-QueryChat-ui}{}}}
 \subsection{\code{QueryChat$ui()}}{
   Create the UI for the querychat chat interface.
-
-This method generates the chat UI component. Typically you'll use
-\verb{$sidebar()} instead, which wraps this in a sidebar layout.
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{qc <- QueryChat$new(mtcars)
-
-ui <- fluidPage(
-  qc$ui()
-)
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$ui(..., id = NULL)}
@@ -434,10 +474,7 @@ ui <- fluidPage(
     \if{html}{\out{<div class="arguments">}}
     \describe{
       \item{\code{...}}{Additional arguments passed to \code{\link[shinychat:chat_ui]{shinychat::chat_ui()}}.}
-      \item{\code{id}}{Optional ID for the QueryChat instance. If not provided,
-will use the ID provided at initialization. If using \verb{$ui()} in a Shiny
-module, you'll need to provide \code{id = ns("your_id")} where \code{ns} is the
-namespacing function from \code{\link[shiny:NS]{shiny::NS()}}.}
+      \item{\code{id}}{Optional ID for the QueryChat instance.}
     }
     \if{html}{\out{</div>}}
   }
@@ -451,21 +488,6 @@ namespacing function from \code{\link[shiny:NS]{shiny::NS()}}.}
 \if{latex}{\out{\hypertarget{method-QueryChat-server}{}}}
 \subsection{\code{QueryChat$server()}}{
   Initialize the querychat server logic.
-
-This method must be called within a Shiny server function. It sets up the
-reactive logic for the chat interface and returns session-specific
-reactive values.
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{qc <- QueryChat$new(mtcars)
-
-server <- function(input, output, session) \{
-  qc_vals <- qc$server(enable_bookmarking = TRUE)
-
-  output$data <- renderDataTable(qc_vals$df())
-  output$query <- renderText(qc_vals$sql())
-  output$title <- renderText(qc_vals$title() \%||\% "No Query")
-\}
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$server(
@@ -481,40 +503,23 @@ server <- function(input, output, session) \{
   \subsection{Arguments}{
     \if{html}{\out{<div class="arguments">}}
     \describe{
-      \item{\code{data_source}}{Optional data source to use. If provided, sets the
-data_source property before initializing server logic. This is useful
-for the deferred pattern where data_source is not known at
-initialization time (e.g., when the data source depends on session-
-specific authentication).}
-      \item{\code{client}}{Optional chat client override for this session. Can be an
-\link[ellmer:Chat]{ellmer::Chat} object or a string (e.g., \code{"openai/gpt-4o"}). If provided,
-overrides the client set at initialization for this session only —
-other sessions are unaffected. This is useful when the client must be
-created within a session scope (e.g., Posit Connect managed credentials).}
-      \item{\code{enable_bookmarking}}{Whether to enable bookmarking for the chat
-state. Default is \code{FALSE}. When enabled, the chat state (including
-current query, title, and chat history) will be saved and restored
-with Shiny bookmarks. This requires that the Shiny app has bookmarking
-enabled via \code{shiny::enableBookmarking()} or the \code{enableBookmarking}
-parameter of \code{shiny::shinyApp()}.}
+      \item{\code{data_source}}{Optional data source for backward compatibility.
+If provided, calls \verb{$add_table()} before initializing server logic.}
+      \item{\code{client}}{Optional chat client override for this session.}
+      \item{\code{enable_bookmarking}}{Whether to enable bookmarking. Default is \code{FALSE}.}
       \item{\code{...}}{Ignored.}
-      \item{\code{id}}{Optional module ID for the QueryChat instance. If not provided,
-will use the ID provided at initialization. When used in Shiny modules,
-this \code{id} should match the \code{id} used in the corresponding UI function
-(i.e., \code{qc$ui(id = ns("your_id"))} pairs with \code{qc$server(id = "your_id")}).}
+      \item{\code{id}}{Optional module ID override.}
       \item{\code{session}}{The Shiny session object.}
     }
     \if{html}{\out{</div>}}
   }
   \subsection{Returns}{
     A list containing session-specific reactive values and the chat
-client with the following elements:
-\itemize{
-\item \code{df}: Reactive expression returning the current filtered data frame
-\item \code{sql}: Reactive value for the current SQL query string
-\item \code{title}: Reactive value for the current title
-\item \code{client}: The session-specific chat client instance
-}
+client. For single-table usage, the list includes \code{df}, \code{sql}, and \code{title} directly.
+For multi-table usage, call \code{qc_vals$table("name")} to get a \link{TableAccessor}
+with per-table reactive state. The list also includes \code{table_names()}, which lists the
+tables, and \code{current_table()}, which returns the name of the most recently queried table,
+or \code{NULL} before any query.
   }
 }
 
@@ -523,22 +528,6 @@ client with the following elements:
 \if{latex}{\out{\hypertarget{method-QueryChat-generate_greeting}{}}}
 \subsection{\code{QueryChat$generate_greeting()}}{
   Generate a welcome greeting for the chat.
-
-By default, \code{QueryChat$new()} generates a greeting at the start of every
-new conversation, which is convenient for getting started and
-development, but also might add unnecessary latency and cost. Use this
-method to generate a greeting once and save it for reuse.
-
-\if{html}{\out{<div class="sourceCode r">}}\preformatted{# Create QueryChat object
-qc <- QueryChat$new(mtcars)
-
-# Generate a greeting and save it
-greeting <- qc$generate_greeting()
-writeLines(greeting, "mtcars_greeting.md")
-
-# Later, use the saved greeting
-qc2 <- QueryChat$new(mtcars, greeting = "mtcars_greeting.md")
-}\if{html}{\out{</div>}}
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$generate_greeting(echo = c("none", "output"))}
@@ -547,8 +536,7 @@ qc2 <- QueryChat$new(mtcars, greeting = "mtcars_greeting.md")
   \subsection{Arguments}{
     \if{html}{\out{<div class="arguments">}}
     \describe{
-      \item{\code{echo}}{Whether to print the greeting to the console. Options are
-\code{"none"} (default, no output) or \code{"output"} (print to console).}
+      \item{\code{echo}}{Whether to print the greeting to the console.}
     }
     \if{html}{\out{</div>}}
   }
@@ -562,13 +550,6 @@ qc2 <- QueryChat$new(mtcars, greeting = "mtcars_greeting.md")
 \if{latex}{\out{\hypertarget{method-QueryChat-cleanup}{}}}
 \subsection{\code{QueryChat$cleanup()}}{
   Clean up resources associated with the data source.
-
-This method releases any resources (e.g., database connections)
-associated with the data source. Call this when you are done using the
-QueryChat object to avoid resource leaks.
-
-Note: If \code{auto_cleanup} was set to \code{TRUE} in the constructor, this will
-be called automatically when the Shiny app stops.
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
     \preformatted{QueryChat$cleanup()}
diff --git a/pkg-r/man/TableAccessor.Rd b/pkg-r/man/TableAccessor.Rd
new file mode 100644
index 000000000..9b8557bdd
--- /dev/null
+++ b/pkg-r/man/TableAccessor.Rd
@@ -0,0 +1,106 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/TableAccessor.R
+\name{TableAccessor}
+\alias{TableAccessor}
+\title{Table Accessor}
+\description{
+Accessor for a specific table's data source and per-table reactive state.
+Returned by the \verb{$table("name")} method of the list that \verb{QueryChat$server()} returns.
+}
+\keyword{internal}
+\section{Active bindings}{
+  \if{html}{\out{<div class="r6-active-bindings">}}
+  \describe{
+    \item{\code{table_name}}{The name of this table.}
+
+    \item{\code{data_source}}{The DataSource for this table.}
+  }
+  \if{html}{\out{</div>}}
+}
+\section{Methods}{
+\subsection{Public methods}{
+  \itemize{
+    \item \href{#method-TableAccessor-initialize}{\code{TableAccessor$new()}}
+    \item \href{#method-TableAccessor-df}{\code{TableAccessor$df()}}
+    \item \href{#method-TableAccessor-sql}{\code{TableAccessor$sql()}}
+    \item \href{#method-TableAccessor-title}{\code{TableAccessor$title()}}
+    \item \href{#method-TableAccessor-clone}{\code{TableAccessor$clone()}}
+  }
+}
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TableAccessor-initialize"></a>}}
+\if{latex}{\out{\hypertarget{method-TableAccessor-initialize}{}}}
+\subsection{\code{TableAccessor$new()}}{
+  Create a new TableAccessor.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TableAccessor$new(table_name, data_source, state)}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Arguments}{
+    \if{html}{\out{<div class="arguments">}}
+    \describe{
+      \item{\code{table_name}}{The name of the table.}
+      \item{\code{data_source}}{The DataSource for this table.}
+      \item{\code{state}}{List of per-table reactive state (\code{sql}, \code{title}, \code{df}).}
+    }
+    \if{html}{\out{</div>}}
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TableAccessor-df"></a>}}
+\if{latex}{\out{\hypertarget{method-TableAccessor-df}{}}}
+\subsection{\code{TableAccessor$df()}}{
+  Return the current filtered data for this table.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TableAccessor$df()}
+    \if{html}{\out{</div>}}
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TableAccessor-sql"></a>}}
+\if{latex}{\out{\hypertarget{method-TableAccessor-sql}{}}}
+\subsection{\code{TableAccessor$sql()}}{
+  Return the current SQL filter for this table.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TableAccessor$sql()}
+    \if{html}{\out{</div>}}
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TableAccessor-title"></a>}}
+\if{latex}{\out{\hypertarget{method-TableAccessor-title}{}}}
+\subsection{\code{TableAccessor$title()}}{
+  Return the current filter title for this table.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TableAccessor$title()}
+    \if{html}{\out{</div>}}
+  }
+}
+
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TableAccessor-clone"></a>}}
+\if{latex}{\out{\hypertarget{method-TableAccessor-clone}{}}}
+\subsection{\code{TableAccessor$clone()}}{
+  The objects of this class are cloneable with this method.
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TableAccessor$clone(deep = FALSE)}
+    \if{html}{\out{</div>}}
+  }
+  \subsection{Arguments}{
+    \if{html}{\out{<div class="arguments">}}
+    \describe{
+      \item{\code{deep}}{Whether to make a deep clone.}
+    }
+    \if{html}{\out{</div>}}
+  }
+}
+
+}
diff --git a/pkg-r/man/TblSqlSource.Rd b/pkg-r/man/TblSqlSource.Rd
index af4bb42be..f15a1cccc 100644
--- a/pkg-r/man/TblSqlSource.Rd
+++ b/pkg-r/man/TblSqlSource.Rd
@@ -46,6 +46,7 @@ mtcars_source$cleanup()
     \item \href{#method-TblSqlSource-initialize}{\code{TblSqlSource$new()}}
     \item \href{#method-TblSqlSource-get_db_type}{\code{TblSqlSource$get_db_type()}}
     \item \href{#method-TblSqlSource-get_schema}{\code{TblSqlSource$get_schema()}}
+    \item \href{#method-TblSqlSource-get_schema_result}{\code{TblSqlSource$get_schema_result()}}
     \item \href{#method-TblSqlSource-execute_query}{\code{TblSqlSource$execute_query()}}
     \item \href{#method-TblSqlSource-test_query}{\code{TblSqlSource$test_query()}}
     \item \href{#method-TblSqlSource-prep_query}{\code{TblSqlSource$prep_query()}}
@@ -106,7 +107,7 @@ string, or will be inferred from the \code{tbl} argument, if possible.}
   Get schema information about the table
   \subsection{Usage}{
     \if{html}{\out{<div class="r">}}
-    \preformatted{TblSqlSource$get_schema(categorical_threshold = 20)}
+    \preformatted{TblSqlSource$get_schema(categorical_threshold = 20, table_spec = NULL)}
     \if{html}{\out{</div>}}
   }
   \subsection{Arguments}{
@@ -122,6 +123,17 @@ column to be considered categorical}
   }
 }
 
+\if{html}{\out{<hr>}}
+\if{html}{\out{<a id="method-TblSqlSource-get_schema_result"></a>}}
+\if{latex}{\out{\hypertarget{method-TblSqlSource-get_schema_result}{}}}
+\subsection{\code{TblSqlSource$get_schema_result()}}{
+  \subsection{Usage}{
+    \if{html}{\out{<div class="r">}}
+    \preformatted{TblSqlSource$get_schema_result(categorical_threshold = 20, table_spec = NULL)}
+    \if{html}{\out{</div>}}
+  }
+}
+
 \if{html}{\out{<hr>}}
 \if{html}{\out{<a id="method-TblSqlSource-execute_query"></a>}}
 \if{latex}{\out{\hypertarget{method-TblSqlSource-execute_query}{}}}
diff --git a/pkg-r/man/execute_ggsql.Rd b/pkg-r/man/execute_ggsql.Rd
index 3713aab02..532af74ae 100644
--- a/pkg-r/man/execute_ggsql.Rd
+++ b/pkg-r/man/execute_ggsql.Rd
@@ -2,12 +2,12 @@
 % Please edit documentation in R/querychat_viz.R
 \name{execute_ggsql}
 \alias{execute_ggsql}
-\title{Execute a pre-validated ggsql query against a DataSource}
+\title{Execute a pre-validated ggsql query against an executor}
 \usage{
-execute_ggsql(data_source, validated)
+execute_ggsql(executor, validated)
 }
 \arguments{
-\item{data_source}{A querychat DataSource R6 object.}
+\item{executor}{A querychat QueryExecutor R6 object.}
 
 \item{validated}{A pre-validated ggsql query (from \code{ggsql::ggsql_validate()}).
 Must be a list with \verb{$sql} and \verb{$visual} fields.}
@@ -16,7 +16,7 @@ Must be a list with \verb{$sql} and \verb{$visual} fields.}
 A \code{ggsql::Spec} R6 object (the writer-independent plot specification).
 }
 \description{
-Executes the SQL portion through a DataSource (preserving database pushdown),
+Executes the SQL portion through an executor (preserving database pushdown),
 then feeds the result into a ggsql DuckDB reader to produce a Spec.
 }
 \keyword{internal}
diff --git a/pkg-r/man/querychat-convenience.Rd b/pkg-r/man/querychat-convenience.Rd
index 9a0a63ddd..5be1320fb 100644
--- a/pkg-r/man/querychat-convenience.Rd
+++ b/pkg-r/man/querychat-convenience.Rd
@@ -17,6 +17,7 @@ querychat(
   categorical_threshold = 20,
   extra_instructions = NULL,
   prompt_template = NULL,
+  data_dict = NULL,
   cleanup = NA
 )
 
@@ -32,6 +33,7 @@ querychat_app(
   categorical_threshold = 20,
   extra_instructions = NULL,
   prompt_template = NULL,
+  data_dict = NULL,
   cleanup = NA,
   bookmark_store = "url"
 )
@@ -40,66 +42,33 @@ querychat_app(
 \item{data_source}{Either a data.frame or a database connection (e.g., DBI
 connection).}
 
-\item{table_name}{A string specifying the table name to use in SQL queries.
-If \code{data_source} is a data.frame, this is the name to refer to it by in
-queries (typically the variable name). If not provided, will be inferred
-from the variable name for data.frame inputs. For database connections,
-this parameter is required.}
+\item{table_name}{A string specifying the table name to use in SQL queries.}
 
 \item{...}{Additional arguments (currently unused).}
 
-\item{id}{Optional module ID for the QueryChat instance. If not provided,
-will be auto-generated from \code{table_name}. The ID is used to namespace
-the Shiny module.}
+\item{id}{Optional module ID for the QueryChat instance.}
 
-\item{greeting}{Optional initial message to display to users. Can be a
-character string (in Markdown format) or a file path. If not provided,
-a greeting will be generated at the start of each conversation using the
-LLM, which adds latency and cost. Use \verb{$generate_greeting()} to create
-a greeting to save and reuse.}
+\item{greeting}{Optional initial message to display to users.}
 
-\item{client}{Optional chat client. Can be:
-\itemize{
-\item An \link[ellmer:Chat]{ellmer::Chat} object
-\item A string to pass to \code{\link[ellmer:chat]{ellmer::chat()}} (e.g., \code{"openai/gpt-4o"})
-\item \code{NULL} (default): Uses the \code{querychat.client} option, the
-\code{QUERYCHAT_CLIENT} environment variable, or defaults to
-\code{\link[ellmer:chat_openai]{ellmer::chat_openai()}}
-}}
+\item{client}{Optional chat client.}
 
-\item{tools}{Which querychat tools to include in the chat client, by
-default. \code{"filter"} includes the tools for filtering and resetting the
-dashboard and \code{"query"} includes the tool for executing SQL queries.
-Use \code{tools = "filter"} when you only want the dashboard filtering tools,
-or when you want to disable the querying tool entirely to prevent the
-LLM from seeing any of the data in your dataset. The legacy name
-\code{"update"} is still accepted as an alias for \code{"filter"}.}
+\item{tools}{Which querychat tools to include in the chat client.}
 
-\item{data_description}{Optional description of the data in plain text or
-Markdown. Can be a string or a file path. This provides context to the
-LLM about what the data represents.}
+\item{data_description}{Optional description of the data.}
 
 \item{categorical_threshold}{For text columns, the maximum number of unique
 values to consider as a categorical variable. Default is 20.}
 
-\item{extra_instructions}{Optional additional instructions for the chat
-model in plain text or Markdown. Can be a string or a file path.}
+\item{extra_instructions}{Optional additional instructions for the chat model.}
 
-\item{prompt_template}{Optional path to or string of a custom prompt
-template file. If not provided, the default querychat template will be
-used. See the package prompts directory for the default template format.}
+\item{prompt_template}{Optional path to or string of a custom prompt template.}
 
-\item{cleanup}{Whether or not to automatically run \verb{$cleanup()} when the
-Shiny session/app stops. By default, cleanup only occurs if \code{QueryChat}
-is created within a Shiny app. Set to \code{TRUE} to always clean up, or
-\code{FALSE} to never clean up automatically.
+\item{data_dict}{Optional data dictionary. A path to a YAML file or a list of paths.}
 
-In \code{querychat_app()}, in-memory databases created for data frames are
-always cleaned up.}
+\item{cleanup}{Whether or not to automatically run \verb{$cleanup()} when the
+Shiny session/app stops.}
 
-\item{bookmark_store}{The bookmarking storage method. Passed to
-\code{\link[shiny:enableBookmarking]{shiny::enableBookmarking()}}. If \code{"url"} or \code{"server"}, the chat state
-(including current query) will be bookmarked. Default is \code{"url"}.}
+\item{bookmark_store}{The bookmarking storage method. Default is \code{"url"}.}
 }
 \value{
 A \code{QueryChat} object. See \link{QueryChat} for available methods.
@@ -114,23 +83,5 @@ and app launching (i.e., \code{querychat_app()}).
 \dontshow{if (rlang::is_interactive() && rlang::is_installed("RSQLite")) withAutoprint(\{ # examplesIf}
 # Quick start - chat with mtcars dataset in one line
 querychat_app(mtcars)
-
-# Add options
-querychat_app(
-  mtcars,
-  greeting = "Welcome to the mtcars explorer!",
-  client = "openai/gpt-4o"
-)
-
-# Chat with a database table (table_name required)
-con <- DBI::dbConnect(RSQLite::SQLite(), ":memory:")
-DBI::dbWriteTable(con, "mtcars", mtcars)
-querychat_app(con, "mtcars")
-
-# Create QueryChat class object
-qc <- querychat(mtcars, greeting = "Welcome to the mtcars explorer!")
-
-# Run the app later
-qc$app()
 \dontshow{\}) # examplesIf}
 }
diff --git a/pkg-r/man/read_data_dict.Rd b/pkg-r/man/read_data_dict.Rd
new file mode 100644
index 000000000..25c43271d
--- /dev/null
+++ b/pkg-r/man/read_data_dict.Rd
@@ -0,0 +1,22 @@
+% Generated by roxygen2: do not edit by hand
+% Please edit documentation in R/DataDict.R
+\name{read_data_dict}
+\alias{read_data_dict}
+\title{Read a Data Dictionary from YAML}
+\usage{
+read_data_dict(path)
+}
+\arguments{
+\item{path}{Path to the YAML file.}
+}
+\value{
+A named list with the structure of the YAML file.
+}
+\description{
+Loads a data dictionary from a YAML file conforming to the
+\href{https://data-dict.tidyverse.org/}{data-dict spec}. The dictionary is
+returned as a plain list and can be passed directly to \link{QueryChat} via the
+\code{data_dict} argument.
+
+If the YAML file has no top-level \code{name} field, the name defaults to the file stem (the file name without its extension).
+}
diff --git a/pkg-r/pkgdown/_pkgdown.yml b/pkg-r/pkgdown/_pkgdown.yml
index 2312aa5ab..364231216 100644
--- a/pkg-r/pkgdown/_pkgdown.yml
+++ b/pkg-r/pkgdown/_pkgdown.yml
@@ -69,6 +69,8 @@ reference:
   contents:
   - querychat
   - QueryChat
+  - TableAccessor
+  - read_data_dict
 - title: Data sources
   contents:
   - ends_with("Source")
diff --git a/pkg-r/tests/testthat/_snaps/querychat_tools.md b/pkg-r/tests/testthat/_snaps/querychat_tools.md
index eea808c30..a1a4c875d 100644
--- a/pkg-r/tests/testthat/_snaps/querychat_tools.md
+++ b/pkg-r/tests/testthat/_snaps/querychat_tools.md
@@ -1,44 +1,29 @@
-# tool_update_dashboard() checks inputs
+# tool_update_dashboard() checks update_fn inputs
 
     Code
-      tool_update_dashboard("foo")
-    Condition
-      Error in `tool_update_dashboard()`:
-      ! `data_source` must be a <DataSource> object, not a string.
-
----
-
-    Code
-      tool_update_dashboard(df_source, update_fn = NULL)
+      tool_update_dashboard(executor, "test_table", update_fn = NULL)
     Condition
       Error in `tool_update_dashboard()`:
       ! `update_fn` must be a function, not `NULL`.
     Code
-      tool_update_dashboard(df_source, update_fn = function(query) { })
+      tool_update_dashboard(executor, "test_table", update_fn = function(query) { })
     Condition
       Error in `tool_update_dashboard()`:
-      ! `update_fn` must accept at least two named arguments: "query" and "title".
-      x "title" argument was missing.
+      ! `update_fn` must accept at least three named arguments: "query", "title", and "table".
+      x "title" and "table" arguments were missing.
     Code
-      tool_update_dashboard(df_source, update_fn = function(title, extra) { })
+      tool_update_dashboard(executor, "test_table", update_fn = function(title, extra)
+        { })
     Condition
       Error in `tool_update_dashboard()`:
-      ! `update_fn` must accept at least two named arguments: "query" and "title".
-      x "query" argument was missing.
+      ! `update_fn` must accept at least three named arguments: "query", "title", and "table".
+      x "query" and "table" arguments were missing.
 
 # tool_reset_dashboard() checks inputs
 
     Code
-      tool_reset_dashboard("not_a_function")
+      tool_reset_dashboard("not_a_function", table_names = "t")
     Condition
       Error in `tool_reset_dashboard()`:
       ! `reset_fn` must be a function, not the string "not_a_function".
 
-# tool_query() checks inputs
-
-    Code
-      tool_query("invalid_source")
-    Condition
-      Error in `tool_query()`:
-      ! `data_source` must be a <DataSource> object, not a string.
-
diff --git a/pkg-r/tests/testthat/helper-fixtures.R b/pkg-r/tests/testthat/helper-fixtures.R
index d800b0106..3775b84ee 100644
--- a/pkg-r/tests/testthat/helper-fixtures.R
+++ b/pkg-r/tests/testthat/helper-fixtures.R
@@ -1,5 +1,10 @@
 # Test fixture constructors for data source tests
 
+# Test helper only: return the entry stored under `table_name` in `qc`'s private `.data_sources` field (reaches into object internals via `.__enclos_env__`).
+qc_data_source <- function(qc, table_name) {
+  qc$.__enclos_env__$private$.data_sources[[table_name]]
+}
+
 # Simple data frame with id, name, and value columns
 new_test_df <- function(rows = 5) {
   data.frame(
diff --git a/pkg-r/tests/testthat/test-DBISource.R b/pkg-r/tests/testthat/test-DBISource.R
index 69ff7be26..487052ff4 100644
--- a/pkg-r/tests/testthat/test-DBISource.R
+++ b/pkg-r/tests/testthat/test-DBISource.R
@@ -82,9 +82,11 @@ describe("DBISource$test_query()", {
 
     expect_error(dbi_source$test_query("SELECT * FROM non_existent_table"))
 
-    expect_error(dbi_source$test_query(
-      "SELECT non_existent_column FROM test_table"
-    ))
+    expect_error(
+      dbi_source$test_query(
+        "SELECT non_existent_column FROM test_table"
+      )
+    )
   })
 
   it("works with different data types", {
diff --git a/pkg-r/tests/testthat/test-DataDict.R b/pkg-r/tests/testthat/test-DataDict.R
new file mode 100644
index 000000000..f10aab403
--- /dev/null
+++ b/pkg-r/tests/testthat/test-DataDict.R
@@ -0,0 +1,154 @@
+describe("read_data_dict()", {
+  # Round trip: each top-level section written to the file is read back.
+  it("reads a YAML file and returns a plain list", {
+    path <- withr::local_tempfile(fileext = ".yaml")
+    yaml_lines <- c(
+      "name: test",
+      "description: Test domain",
+      "tables:",
+      "  orders:",
+      "    description: Orders table",
+      "    columns:",
+      "      - name: id",
+      "        type: integer",
+      "        description: Primary key",
+      "relationships:",
+      "  - join: orders.customer_id = customers.id",
+      "    description: Order belongs to customer",
+      "    cardinality: many-to-one",
+      "glossary:",
+      "  ARR: Annual Recurring Revenue"
+    )
+    writeLines(yaml_lines, path)
+
+    dict <- read_data_dict(path)
+    expect_true(is.list(dict))
+    expect_equal(dict[["name"]], "test")
+    expect_equal(dict[["description"]], "Test domain")
+
+    orders <- dict[["tables"]][["orders"]]
+    expect_true(is.list(orders))
+    expect_equal(orders[["description"]], "Orders table")
+    expect_length(orders[["columns"]], 1)
+    expect_equal(orders[["columns"]][[1]][["name"]], "id")
+
+    expect_length(dict[["relationships"]], 1)
+    first_rel <- dict[["relationships"]][[1]]
+    expect_equal(first_rel[["join"]], "orders.customer_id = customers.id")
+    expect_equal(dict[["glossary"]][["ARR"]], "Annual Recurring Revenue")
+  })
+
+  it("defaults name to file stem when not in YAML", {
+    path <- withr::local_tempfile(fileext = ".yaml")
+    writeLines("description: No name here", path)
+    # Expected fallback: the temp file's base name without its extension.
+    file_stem <- tools::file_path_sans_ext(basename(path))
+    expect_equal(read_data_dict(path)[["name"]], file_stem)
+  })
+
+  # A nested `range` mapping and an inline `values` sequence are both parsed
+  # into R structures that can be indexed by name.
+  it("reads a YAML with column range and values", {
+    path <- withr::local_tempfile(fileext = ".yaml")
+    yaml_lines <- c(
+      "tables:",
+      "  products:",
+      "    columns:",
+      "      - name: price",
+      "        range:",
+      "          min: 0",
+      "          max: 999",
+      "      - name: category",
+      "        values: [A, B, C]"
+    )
+    writeLines(yaml_lines, path)
+
+    dict <- read_data_dict(path)
+    columns <- dict[["tables"]][["products"]][["columns"]]
+    price <- columns[[1]]
+    category <- columns[[2]]
+
+    expect_equal(price[["range"]][["min"]], 0)
+    expect_equal(price[["range"]][["max"]], 999)
+    expect_equal(category[["values"]], c("A", "B", "C"))
+  })
+})
+
+describe("data_dict_to_prompt_list()", {
+  it("returns list with name and description", {
+    input <- list(name = "sales", description = "Sales domain")
+    prompt <- data_dict_to_prompt_list(input)
+    expect_equal(prompt[["name"]], "sales")
+    expect_equal(prompt[["description"]], "Sales domain")
+  })
+
+  it("omits NULL name and description", {
+    # An empty dictionary supplies neither field, so neither key is expected.
+    prompt_fields <- names(data_dict_to_prompt_list(list()))
+    expect_false("name" %in% prompt_fields)
+    expect_false("description" %in% prompt_fields)
+  })
+
+  it("includes table descriptions but strips column details", {
+    # Only the table-level `description` should survive; `details` and the
+    # `columns` list are expected to be dropped.
+    orders_spec <- list(
+      description = "Orders table",
+      details = "Long details that should not appear",
+      columns = list(
+        list(name = "id", description = "PK", details = "Internal only")
+      )
+    )
+    input <- list(tables = list(orders = orders_spec))
+
+    prompt <- data_dict_to_prompt_list(input)
+    expect_true("tables" %in% names(prompt))
+
+    # Pull the table entry out once so each assertion stays short.
+    orders <- prompt[["tables"]][["orders"]]
+    expect_equal(orders[["description"]], "Orders table")
+    expect_null(orders[["columns"]])
+    expect_null(orders[["details"]])
+  })
+
+  it("includes relationships as list of non-NULL fields", {
+    # One fully populated relationship goes in; the same three fields should
+    # come back on the single output entry.
+    a_to_b <- list(
+      join = "a.id = b.id",
+      description = "A to B",
+      cardinality = "one-to-many"
+    )
+    prompt <- data_dict_to_prompt_list(list(relationships = list(a_to_b)))
+
+    expect_true("relationships" %in% names(prompt))
+    expect_length(prompt[["relationships"]], 1)
+
+    first_rel <- prompt[["relationships"]][[1]]
+    expect_equal(first_rel[["join"]], "a.id = b.id")
+    expect_equal(first_rel[["description"]], "A to B")
+    expect_equal(first_rel[["cardinality"]], "one-to-many")
+  })
+
+  it("includes glossary", {
+    glossary <- list(ARR = "Annual Recurring Revenue")
+    prompt <- data_dict_to_prompt_list(list(glossary = glossary))
+    expect_true("glossary" %in% names(prompt))
+    expect_equal(prompt[["glossary"]][["ARR"]], "Annual Recurring Revenue")
+  })
+
+  it("omits empty tables, relationships, glossary", {
+    # Optional sections missing from the input must not show up as keys.
+    prompt_fields <- names(data_dict_to_prompt_list(list()))
+    expect_false("tables" %in% prompt_fields)
+    expect_false("relationships" %in% prompt_fields)
+    expect_false("glossary" %in% prompt_fields)
+  })
+
+  it("includes table entry as NULL when table has no description", {
+    input <- list(tables = list(no_desc = list()))
+    prompt <- data_dict_to_prompt_list(input)
+    expect_true("tables" %in% names(prompt))
+    expect_null(prompt[["tables"]][["no_desc"]])
+  })
+})
diff --git a/pkg-r/tests/testthat/test-DataSource.R b/pkg-r/tests/testthat/test-DataSource.R
index cf2fc0468..7defe8c21 100644
--- a/pkg-r/tests/testthat/test-DataSource.R
+++ b/pkg-r/tests/testthat/test-DataSource.R
@@ -29,7 +29,6 @@ describe("DataSource base class", {
   })
 })
 
-
 describe("DataSource$get_schema()", {
   it("returns proper schema for DataFrameSource", {
     skip_if_no_dataframe_engine()
@@ -311,7 +310,6 @@ describe("DataSource$execute_query()", {
   })
 })
 
-
 describe("test_query() column validation", {
   skip_if_no_dataframe_engine()
 
diff --git a/pkg-r/tests/testthat/test-PinSource.R b/pkg-r/tests/testthat/test-PinSource.R
index 3c2f1e05e..2230dc31f 100644
--- a/pkg-r/tests/testthat/test-PinSource.R
+++ b/pkg-r/tests/testthat/test-PinSource.R
@@ -391,7 +391,7 @@ describe("QueryChat + PinSource integration", {
     prompt_before <- qc$system_prompt
     expect_match(prompt_before, "Motor Trend Cars")
 
-    qc$data_source <- new_test_df()
+    qc$add_table(new_test_df(), 'cars', replace = TRUE)
     prompt_after <- qc$system_prompt
     expect_no_match(prompt_after, "Motor Trend Cars")
 
diff --git a/pkg-r/tests/testthat/test-QueryChat.R b/pkg-r/tests/testthat/test-QueryChat.R
index cbbf20994..99313737d 100644
--- a/pkg-r/tests/testthat/test-QueryChat.R
+++ b/pkg-r/tests/testthat/test-QueryChat.R
@@ -9,8 +9,8 @@ describe("QueryChat$new()", {
     )
     withr::defer(qc$cleanup())
 
-    expect_s3_class(qc$data_source, "DataSource")
-    expect_s3_class(qc$data_source, "DataFrameSource")
+    expect_s3_class(qc_data_source(qc, "test_df"), "DataSource")
+    expect_s3_class(qc_data_source(qc, "test_df"), "DataFrameSource")
   })
 
   it("accepts DataFrameSource directly", {
@@ -22,8 +22,8 @@ describe("QueryChat$new()", {
       greeting = "Test greeting"
     )
 
-    expect_s3_class(qc$data_source, "DataFrameSource")
-    expect_equal(qc$data_source$table_name, "test_source")
+    expect_s3_class(qc_data_source(qc, "test_source"), "DataFrameSource")
+    expect_equal(qc_data_source(qc, "test_source")$table_name, "test_source")
   })
 
   it("accepts DBISource", {
@@ -36,8 +36,8 @@ describe("QueryChat$new()", {
       greeting = "Test greeting"
     )
 
-    expect_s3_class(qc$data_source, "DBISource")
-    expect_equal(qc$data_source$table_name, "test_table")
+    expect_s3_class(qc_data_source(qc, "test_table"), "DBISource")
+    expect_equal(qc_data_source(qc, "test_table")$table_name, "test_table")
   })
 
   it("infers table_name from data.frame variable name", {
@@ -45,7 +45,7 @@ describe("QueryChat$new()", {
     qc <- QueryChat$new(my_data, greeting = "Test")
     withr::defer(qc$cleanup())
 
-    expect_equal(qc$data_source$table_name, "my_data")
+    expect_equal(qc_data_source(qc, "my_data")$table_name, "my_data")
     expect_equal(qc$id, "querychat_my_data")
   })
 
@@ -104,7 +104,7 @@ describe("QueryChat$new()", {
 describe("QueryChat deferred client", {
   it("accepts NULL data_source with table_name", {
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_null(qc$data_source)
+    expect_equal(length(qc$table_names()), 0L)
     expect_equal(qc$id, "querychat_users")
   })
 
@@ -119,41 +119,53 @@ describe("QueryChat deferred client", {
     withr::local_envvar(OPENAI_API_KEY = NA)
     withr::local_options(querychat.client = NULL)
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_null(qc$data_source)
+    expect_equal(length(qc$table_names()), 0L)
   })
 
   it("stores explicit client string as spec", {
     withr::local_envvar(OPENAI_API_KEY = "boop")
     qc <- QueryChat$new(NULL, "users", greeting = "Test", client = "openai")
-    expect_null(qc$data_source)
+    expect_equal(length(qc$table_names()), 0L)
   })
 
   it("$client() errors when data_source is NULL", {
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_error(qc$client(), "data_source.*must be set")
+    expect_error(
+      qc$client(),
+      "data_source.*must be set|data_source.*set before"
+    )
   })
 
   it("$console() errors when data_source is NULL", {
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_error(qc$console(), "data_source.*must be set")
+    expect_error(
+      qc$console(),
+      "data_source.*must be set|data_source.*set before"
+    )
   })
 
   it("$generate_greeting() errors when data_source is NULL", {
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_error(qc$generate_greeting(), "data_source.*must be set")
+    expect_error(
+      qc$generate_greeting(),
+      "data_source.*must be set|data_source.*set before"
+    )
   })
 
   it("$system_prompt errors when data_source is NULL", {
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_error(qc$system_prompt, "data_source.*must be set")
+    expect_error(
+      qc$system_prompt,
+      "data_source.*must be set|data_source.*set before"
+    )
   })
 
-  it("works after setting data_source later", {
+  it("works after adding table via add_table()", {
     skip_if_no_dataframe_engine()
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    qc$data_source <- new_users_df()
+    qc$add_table(new_users_df(), "users")
 
-    expect_s3_class(qc$data_source, "DataFrameSource")
+    expect_s3_class(qc_data_source(qc, "users"), "DataFrameSource")
     prompt <- qc$system_prompt
     expect_match(prompt, "users")
   })
@@ -186,15 +198,16 @@ describe("QueryChat integration with DBISource", {
       client = mock_client
     )
 
-    expect_s3_class(qc$data_source, "DBISource")
-    expect_s3_class(qc$data_source, "DataSource")
+    iris_source <- qc_data_source(qc, "iris")
+    expect_s3_class(iris_source, "DBISource")
+    expect_s3_class(iris_source, "DataSource")
 
-    result_data <- qc$data_source$execute_query(NULL)
+    result_data <- iris_source$execute_query(NULL)
     expect_s3_class(result_data, "data.frame")
     expect_equal(nrow(result_data), 150)
     expect_equal(ncol(result_data), 5)
 
-    query_result <- qc$data_source$execute_query(
+    query_result <- iris_source$execute_query(
       "SELECT \"Sepal.Length\", \"Sepal.Width\" FROM iris WHERE \"Species\" = 'setosa'"
     )
     expect_s3_class(query_result, "data.frame")
@@ -293,16 +306,20 @@ describe("QueryChat$system_prompt", {
 describe("QueryChat$data_source", {
   skip_if_no_dataframe_engine()
 
-  it("returns the data source object", {
+  it("errors when accessed (removed)", {
     test_df <- new_test_df()
     qc <- QueryChat$new(test_df, greeting = "Test")
     withr::defer(qc$cleanup())
 
-    ds <- qc$data_source
+    expect_error(qc$data_source, "removed")
+  })
 
-    expect_s3_class(ds, "DataSource")
-    expect_s3_class(ds, "DataFrameSource")
-    expect_equal(ds$table_name, "test_df")
+  it("errors when set (removed)", {
+    test_df <- new_test_df()
+    qc <- QueryChat$new(test_df, greeting = "Test")
+    withr::defer(qc$cleanup())
+
+    expect_error(qc$data_source <- test_df, "removed")
   })
 })
 
@@ -334,7 +351,7 @@ describe("QueryChat$client()", {
 
     client <- qc$client(tools = "query")
 
-    # Should only have query tool
+    # Should only have query tool (plus get_schema)
     tool_names <- sapply(client$get_tools(), function(t) t@name)
     expect_contains(tool_names, "querychat_query")
     expect_false("querychat_update_dashboard" %in% tool_names)
@@ -451,7 +468,7 @@ describe("QueryChat$client()", {
     client <- qc$client(tools = "visualize")
 
     tool_names <- sapply(client$get_tools(), function(t) t@name)
-    expect_equal(unname(tool_names), "querychat_visualize")
+    expect_contains(tool_names, "querychat_visualize")
   })
 
   it("registers only visualize tool when tools = 'visualize'", {
@@ -473,7 +490,11 @@ describe("QueryChat$client()", {
     client <- qc$client(tools = "visualize", session = session)
 
     tool_names <- sapply(client$get_tools(), function(t) t@name)
-    expect_equal(unname(tool_names), "querychat_visualize")
+    # get_schema is always registered when tools != NULL
+    expect_contains(tool_names, "querychat_visualize")
+    expect_false("querychat_update_dashboard" %in% tool_names)
+    expect_false("querychat_reset_dashboard" %in% tool_names)
+    expect_false("querychat_query" %in% tool_names)
   })
 
   it("returns client with no tools when tools = NULL", {
@@ -520,8 +541,8 @@ describe("QueryChat$client()", {
     update_calls <- list()
     client <- qc$client(
       tools = "update",
-      update_dashboard = function(query, title) {
-        update_calls <<- list(query = query, title = title)
+      update_dashboard = function(query, title, table) {
+        update_calls <<- list(query = query, title = title, table = table)
       }
     )
 
@@ -538,12 +559,14 @@ describe("QueryChat$client()", {
     # Call the tool - it should execute the query and call the callback
     result <- update_tool(
       query = "SELECT * FROM test_df WHERE id = 1",
-      title = "Test Filter"
+      title = "Test Filter",
+      table = "test_df"
     )
 
     expect_null(result@error)
     expect_equal(update_calls$query, "SELECT * FROM test_df WHERE id = 1")
     expect_equal(update_calls$title, "Test Filter")
+    expect_equal(update_calls$table, "test_df")
   })
 
   it("passes reset_dashboard callback to tool", {
@@ -553,11 +576,11 @@ describe("QueryChat$client()", {
     )
     withr::defer(qc$cleanup())
 
-    reset_called <- FALSE
+    reset_called_with <- NULL
     client <- qc$client(
       tools = "update",
-      reset_dashboard = function() {
-        reset_called <<- TRUE
+      reset_dashboard = function(table) {
+        reset_called_with <<- table
       }
     )
 
@@ -572,9 +595,9 @@ describe("QueryChat$client()", {
     ]]
 
     # Call the tool
-    reset_tool()
+    reset_tool("test_df")
 
-    expect_true(reset_called)
+    expect_equal(reset_called_with, "test_df")
   })
 
   it("returns independent client instances on each call", {
@@ -675,7 +698,7 @@ describe("querychat()", {
     withr::defer(qc$cleanup())
 
     expect_s3_class(qc, "QueryChat")
-    expect_s3_class(qc$data_source, "DataFrameSource")
+    expect_s3_class(qc_data_source(qc, "test_df"), "DataFrameSource")
     expect_equal(qc$greeting, "Test greeting")
   })
 
@@ -684,7 +707,10 @@ describe("querychat()", {
     qc <- querychat(my_test_data, greeting = "Test")
     withr::defer(qc$cleanup())
 
-    expect_equal(qc$data_source$table_name, "my_test_data")
+    expect_equal(
+      qc_data_source(qc, "my_test_data")$table_name,
+      "my_test_data"
+    )
   })
 
   it("passes all arguments to QueryChat$new()", {
@@ -702,7 +728,7 @@ describe("querychat()", {
 
     expect_equal(qc$id, "custom_id")
     expect_equal(qc$greeting, "Custom greeting")
-    expect_equal(qc$data_source$table_name, "custom_name")
+    expect_equal(qc_data_source(qc, "custom_name")$table_name, "custom_name")
   })
 })
 
@@ -734,7 +760,8 @@ describe("QueryChat$console()", {
     expect_s3_class(console_client, "Chat")
 
     tools <- console_client$get_tools()
-    expect_equal(names(tools), "querychat_query")
+    tool_names <- names(tools)
+    expect_contains(tool_names, "querychat_query")
   })
 
   it("persists console client across calls", {
@@ -782,7 +809,7 @@ describe("QueryChat$console()", {
     expect_s3_class(console_client, "Chat")
 
     tools <- console_client$get_tools()
-    expect_setequal(
+    expect_contains(
       names(tools),
       c(
         "querychat_query",
@@ -900,10 +927,9 @@ describe("QueryChat deferred client with $server()", {
     )
   })
 
-  it("$server(data_source=...) sets the data_source", {
+  it("$server(data_source=...) errors without Shiny session", {
     skip_if_no_dataframe_engine()
     qc <- QueryChat$new(NULL, "users", greeting = "Test")
-    expect_null(qc$data_source)
 
     expect_error(
       qc$server(data_source = new_users_df()),
@@ -911,3 +937,105 @@ describe("QueryChat deferred client with $server()", {
     )
   })
 })
+
+describe("QueryChat$add_tables()", {
+  # Open an in-memory SQLite database holding two small tables, `orders` and
+  # `customers`. The disconnect is deferred to `env` (the caller's frame by
+  # default); the calling test is skipped when RSQLite is not installed.
+  local_multi_table_conn <- function(env = parent.frame()) {
+    skip_if_not_installed("RSQLite")
+    con <- DBI::dbConnect(RSQLite::SQLite(), ":memory:")
+    withr::defer(DBI::dbDisconnect(con), envir = env)
+    fixtures <- list(
+      orders = data.frame(id = 1:2, amount = c(9.99, 4.50)),
+      customers = data.frame(id = 1:2, name = c("Alice", "Bob"))
+    )
+    for (table_name in names(fixtures)) {
+      DBI::dbWriteTable(con, table_name, fixtures[[table_name]])
+    }
+    con
+  }
+
+  it("auto-discovery registers all tables", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # No `tables` argument; warnings are silenced, only the names matter here.
+    suppressWarnings(chat$add_tables(con))
+    expect_setequal(chat$table_names(), c("orders", "customers"))
+  })
+
+  it("explicit tables registers only those", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # `customers` also exists in the database but was not requested.
+    chat$add_tables(con, tables = "orders")
+    expect_equal(chat$table_names(), "orders")
+  })
+
+  it("nonexistent table name raises error", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # The fixture database has no table called `nonexistent`.
+    expect_error(chat$add_tables(con, tables = "nonexistent"), "not found")
+  })
+
+  it("duplicate without replace raises error", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    chat$add_tables(con, tables = "orders")
+    # Registering the same table a second time must be rejected.
+    expect_error(chat$add_tables(con, tables = "orders"), "already exists")
+  })
+
+  it("replace = TRUE on existing table succeeds", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    chat$add_tables(con, tables = "orders")
+    # With `replace = TRUE` the second registration is allowed.
+    expect_no_error(chat$add_tables(con, tables = "orders", replace = TRUE))
+    expect_true("orders" %in% chat$table_names())
+  })
+
+  it("non-DBI argument raises error", {
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # A data frame is passed where a DBI connection is required.
+    expect_error(chat$add_tables(new_test_df()), "DBIConnection")
+  })
+
+  it("empty tables vector raises error", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # An explicitly empty selection is an error, not a silent no-op.
+    expect_error(
+      chat$add_tables(con, tables = character(0)),
+      "No tables found"
+    )
+  })
+
+  it("calling after server initialization raises error", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+    # Set the private flag by hand to simulate an already-initialized server
+    # before attempting to register tables.
+    chat$.__enclos_env__$private$.server_initialized <- TRUE
+    expect_error(chat$add_tables(con), "after server initialization")
+  })
+
+  it("system prompt built exactly once for multiple tables", {
+    con <- local_multi_table_conn()
+    chat <- QueryChat$new(NULL, "placeholder", greeting = "Test")
+
+    # Collect the message of every warning raised by add_tables(), muffling
+    # each one so the call runs to completion.
+    seen <- character(0)
+    record_warning <- function(w) {
+      seen <<- c(seen, conditionMessage(w))
+      invokeRestart("muffleWarning")
+    }
+    withCallingHandlers(chat$add_tables(con), warning = record_warning)
+
+    # NOTE(review): a single "Multiple tables" warning appears to stand in
+    # for "prompt built once" -- confirm against the implementation.
+    expect_length(grep("Multiple tables", seen, value = TRUE), 1L)
+  })
+})
diff --git a/pkg-r/tests/testthat/test-QueryChatSystemPrompt.R b/pkg-r/tests/testthat/test-QueryChatSystemPrompt.R
index 5bf3e88e5..59894650f 100644
--- a/pkg-r/tests/testthat/test-QueryChatSystemPrompt.R
+++ b/pkg-r/tests/testthat/test-QueryChatSystemPrompt.R
@@ -8,12 +8,11 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template: {{schema}}",
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     expect_type(sp$template, "character")
     expect_true(grepl("Template:", sp$template))
-    expect_type(sp$schema, "character")
     expect_equal(sp$categorical_threshold, 10)
   })
 
@@ -27,7 +26,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = temp_file,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     expect_type(sp$template, "character")
@@ -41,7 +40,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds,
+      data_sources = list(test_table = ds),
       data_description = "Test data description"
     )
 
@@ -58,7 +57,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds,
+      data_sources = list(test_table = ds),
       data_description = temp_file
     )
 
@@ -72,7 +71,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds,
+      data_sources = list(test_table = ds),
       extra_instructions = "Extra instructions here"
     )
 
@@ -89,7 +88,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds,
+      data_sources = list(test_table = ds),
       extra_instructions = temp_file
     )
 
@@ -103,7 +102,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds,
+      data_sources = list(test_table = ds),
       categorical_threshold = 25
     )
 
@@ -117,7 +116,7 @@ describe("QueryChatSystemPrompt$new()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Template",
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     expect_null(sp$data_description)
@@ -140,7 +139,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(c("update", "query"))
@@ -164,7 +163,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render("query")
@@ -188,7 +187,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render("update")
@@ -213,7 +212,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -231,7 +230,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Schema: {{schema}}",
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -247,7 +246,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Database: {{db_type}}",
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -268,7 +267,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds,
+      data_sources = list(test_table = ds),
       data_description = "My test data"
     )
 
@@ -290,7 +289,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -311,7 +310,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds,
+      data_sources = list(test_table = ds),
       extra_instructions = "Be concise"
     )
 
@@ -333,7 +332,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -351,7 +350,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = template,
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -367,7 +366,7 @@ describe("QueryChatSystemPrompt$render()", {
 
     sp <- QueryChatSystemPrompt$new(
       prompt_template = "Simple template",
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
 
     result <- sp$render(NULL)
@@ -389,7 +388,7 @@ describe("QueryChatSystemPrompt with full prompt.md template", {
         "prompt.md",
         package = "querychat"
       ),
-      data_source = ds,
+      data_sources = list(test_table = ds),
       data_description = "A test dataframe"
     )
     prompt <- sp$render(NULL)
@@ -397,7 +396,7 @@ describe("QueryChatSystemPrompt with full prompt.md template", {
     expect_type(prompt, "character")
     expect_true(nchar(prompt) > 0)
     expect_match(prompt, "A test dataframe")
-    expect_match(prompt, "Table: test_table")
+    expect_match(prompt, "test_table")
   })
 
   it("includes DuckDB-specific content for DuckDB sources", {
@@ -411,7 +410,7 @@ describe("QueryChatSystemPrompt with full prompt.md template", {
         "prompt.md",
         package = "querychat"
       ),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     sys_prompt <- sp$render(NULL)
 
@@ -419,8 +418,7 @@ describe("QueryChatSystemPrompt with full prompt.md template", {
     expect_true(grepl("DuckDB SQL Tips", sys_prompt, fixed = TRUE))
   })
 
-  it("handles categorical_threshold with full template", {
-    # Create a source with categorical data
+  it("stores categorical_threshold for on-demand schema", {
     df_with_categories <- data.frame(
       id = 1:10,
       category = rep(c("A", "B", "C", "D", "E"), each = 2)
@@ -428,31 +426,18 @@ describe("QueryChatSystemPrompt with full prompt.md template", {
     cat_source <- DataFrameSource$new(df_with_categories, "test_table")
     withr::defer(cat_source$cleanup())
 
-    # With low threshold, categories should not be listed
-    sp_low <- QueryChatSystemPrompt$new(
+    sp <- QueryChatSystemPrompt$new(
       prompt_template = system.file(
         "prompts",
         "prompt.md",
         package = "querychat"
       ),
-      data_source = cat_source,
+      data_sources = list(test_table = cat_source),
       categorical_threshold = 3
     )
-    prompt_low <- sp_low$render(NULL)
-    expect_false(grepl("Categorical values:", prompt_low))
-
-    # With high threshold, categories should be listed
-    sp_high <- QueryChatSystemPrompt$new(
-      prompt_template = system.file(
-        "prompts",
-        "prompt.md",
-        package = "querychat"
-      ),
-      data_source = cat_source,
-      categorical_threshold = 10
-    )
-    prompt_high <- sp_high$render(NULL)
-    expect_match(prompt_high, "Categorical values:")
+    expect_equal(sp$categorical_threshold, 3)
+    prompt <- sp$render(NULL)
+    expect_match(prompt, "querychat_get_schema")
   })
 })
 
@@ -467,7 +452,7 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("query", "visualize"))
     expect_match(rendered, "querychat_visualize")
@@ -479,7 +464,7 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("query"))
     expect_no_match(rendered, "querychat_visualize")
@@ -489,7 +474,7 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("query"))
     expect_match(rendered, "visualization is not currently enabled")
@@ -499,7 +484,7 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("visualize"))
     expect_match(rendered, "ggsql-syntax-reference")
@@ -516,7 +501,7 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("query", "visualize"))
     expect_match(rendered, "Avoid redundant expanded results")
@@ -526,66 +511,9 @@ describe("viz prompt conditionals", {
     ds <- local_data_frame_source(new_test_df())
     sp <- QueryChatSystemPrompt$new(
       prompt_template = default_prompt(),
-      data_source = ds
+      data_sources = list(test_table = ds)
     )
     rendered <- sp$render(tools = c("visualize"))
     expect_no_match(rendered, "Avoid redundant expanded results")
   })
 })
-
-describe("Schema inference skip", {
-  skip_if_no_dataframe_engine()
-
-  it("skips schema when template doesn't reference {{schema}}", {
-    df <- new_test_df()
-    ds <- DataFrameSource$new(df, "test_table")
-    withr::defer(ds$cleanup())
-
-    sp <- QueryChatSystemPrompt$new(
-      prompt_template = "No schema here: {{db_type}}",
-      data_source = ds
-    )
-
-    expect_equal(sp$schema, "")
-  })
-
-  it("computes schema when template uses {{schema}}", {
-    df <- new_test_df()
-    ds <- DataFrameSource$new(df, "test_table")
-    withr::defer(ds$cleanup())
-
-    sp <- QueryChatSystemPrompt$new(
-      prompt_template = "Schema: {{schema}}",
-      data_source = ds
-    )
-
-    expect_true(nchar(sp$schema) > 0)
-    expect_match(sp$schema, "test_table")
-  })
-
-  it("computes schema for {{{schema}}} triple braces", {
-    df <- new_test_df()
-    ds <- DataFrameSource$new(df, "test_table")
-    withr::defer(ds$cleanup())
-
-    sp <- QueryChatSystemPrompt$new(
-      prompt_template = "Schema: {{{schema}}}",
-      data_source = ds
-    )
-
-    expect_true(nchar(sp$schema) > 0)
-  })
-
-  it("computes schema for {{#schema}} conditional sections", {
-    df <- new_test_df()
-    ds <- DataFrameSource$new(df, "test_table")
-    withr::defer(ds$cleanup())
-
-    sp <- QueryChatSystemPrompt$new(
-      prompt_template = "{{#schema}}Has schema{{/schema}}",
-      data_source = ds
-    )
-
-    expect_true(nchar(sp$schema) > 0)
-  })
-})
diff --git a/pkg-r/tests/testthat/test-QueryExecutor.R b/pkg-r/tests/testthat/test-QueryExecutor.R
new file mode 100644
index 000000000..ca922c74f
--- /dev/null
+++ b/pkg-r/tests/testthat/test-QueryExecutor.R
@@ -0,0 +1,188 @@
+describe("DataSourceExecutor", {
+  skip_if_not_installed("duckdb")
+  # Shared fixture: one "users" table wrapped in a DataSourceExecutor.
+  src <- local_data_frame_source(new_users_df(), "users")
+  table_sources <- list(users = src)
+  executor <- DataSourceExecutor$new(table_sources)
+
+  it("delegates execute_query() to primary source", {
+    rows <- executor$execute_query("SELECT * FROM users WHERE age > 28")
+    expect_s3_class(rows, "data.frame")
+    expect_equal(nrow(rows), 3)
+  })
+
+  it("delegates test_query() to the named source", {
+    probe <- executor$test_query("SELECT * FROM users", "users")
+    expect_s3_class(probe, "data.frame")
+    expect_equal(nrow(probe), 1)
+  })
+
+  it("returns correct get_db_type()", {
+    expect_equal(executor$get_db_type(), "DuckDB")
+  })
+
+  it("gets schema for a named table", {
+    schema_text <- executor$get_schema("users", categorical_threshold = 20)
+    expect_type(schema_text, "character")
+    expect_match(schema_text, "Table: users")
+    for (col in c("id", "name", "age")) {
+      expect_match(schema_text, col)
+    }
+  })
+})
+
+describe("DuckDBExecutor", {
+  skip_if_not_installed("duckdb")
+
+  it("registers multiple data frames for cross-table JOINs", {
+    scores_df <- data.frame(
+      id = 1:5,
+      score = c(90, 85, 92, 78, 88),
+      stringsAsFactors = FALSE
+    )
+    # List names (users, scores) are the table names the JOIN refers to.
+    tables <- list(users = new_users_df(), scores = scores_df)
+    executor <- DuckDBExecutor$new(tables)
+    withr::defer(executor$cleanup())
+
+    joined <- executor$execute_query(
+      "SELECT u.name, s.score FROM users u JOIN scores s ON u.id = s.id"
+    )
+    expect_s3_class(joined, "data.frame")
+    expect_equal(nrow(joined), 5)
+    expect_true("name" %in% names(joined))
+    expect_true("score" %in% names(joined))
+  })
+
+  it("enforces require_all_columns per table in test_query()", {
+    executor <- DuckDBExecutor$new(list(users = new_users_df()))
+    withr::defer(executor$cleanup())
+
+    # Validate `sql` against the "users" table with require_all_columns on.
+    validate_strict <- function(sql) {
+      executor$test_query(
+        sql,
+        "users",
+        require_all_columns = TRUE
+      )
+    }
+
+    # Selecting only id and name drops a column, so the strict check
+    # must signal the dedicated missing-columns condition.
+    expect_error(
+      validate_strict("SELECT id, name FROM users"),
+      class = "querychat_missing_columns_error"
+    )
+
+    # SELECT * keeps every column, so the same check passes.
+    expect_no_error(
+      validate_strict("SELECT * FROM users")
+    )
+  })
+
+  it("locks down the connection (DDL like CREATE TABLE should fail)", {
+    executor <- DuckDBExecutor$new(list(users = new_users_df()))
+    withr::defer(executor$cleanup())
+
+    # Only the presence of an error is asserted, not its class or message.
+    ddl <- "CREATE TABLE new_table (id INTEGER)"
+    expect_error(
+      executor$execute_query(ddl)
+    )
+  })
+
+  it("returns correct get_db_type()", {
+    executor <- DuckDBExecutor$new(list(users = new_users_df()))
+    withr::defer(executor$cleanup())
+    db_type <- executor$get_db_type()
+    expect_equal(db_type, "DuckDB")
+  })
+
+  it("gets schema for a named table", {
+    executor <- DuckDBExecutor$new(list(users = new_users_df()))
+    withr::defer(executor$cleanup())
+
+    schema_text <- executor$get_schema("users", categorical_threshold = 20)
+    expect_type(schema_text, "character")
+    expect_match(schema_text, "Table: users")
+    for (col in c("id", "name", "age")) {
+      expect_match(schema_text, col)
+    }
+  })
+})
+
+describe("build_query_executor()", {
+  skip_if_not_installed("duckdb")
+
+  it("returns DataSourceExecutor for a single table", {
+    users_src <- local_data_frame_source(new_users_df(), "users")
+    executor <- build_query_executor(list(users = users_src))
+
+    expect_s3_class(executor, "DataSourceExecutor")
+    expect_s3_class(executor, "QueryExecutor")
+  })
+
+  it("returns DuckDBExecutor for multiple DataFrameSources", {
+    users_src <- local_data_frame_source(new_users_df(), "users")
+    test_src <- local_data_frame_source(new_test_df(), "test")
+    sources <- list(users = users_src, test = test_src)
+    executor <- build_query_executor(sources)
+    # Release the executor when this test finishes.
+    withr::defer(executor$cleanup())
+
+    expect_s3_class(executor, "DuckDBExecutor")
+    expect_s3_class(executor, "QueryExecutor")
+  })
+
+  it("returns DataSourceExecutor for multiple DBISources sharing same connection", {
+    skip_if_not_installed("RSQLite")
+
+    # Both tables are written to one in-memory SQLite connection.
+    conn <- DBI::dbConnect(RSQLite::SQLite(), ":memory:")
+    withr::defer(DBI::dbDisconnect(conn))
+
+    DBI::dbWriteTable(conn, "users", new_users_df())
+    DBI::dbWriteTable(conn, "test_table", new_test_df())
+
+    users_src <- DBISource$new(conn, "users")
+    tests_src <- DBISource$new(conn, "test_table")
+    sources <- list(users = users_src, test_table = tests_src)
+    executor <- build_query_executor(sources)
+
+    expect_s3_class(executor, "DataSourceExecutor")
+    expect_s3_class(executor, "QueryExecutor")
+  })
+})
+
+describe("check_source_compatibility()", {
+  skip_if_not_installed("duckdb")
+
+  it("accepts compatible DataFrameSources", {
+    users_src <- local_data_frame_source(new_users_df(), "users")
+    test_src <- local_data_frame_source(new_test_df(), "test")
+
+    registered <- list(users = users_src)
+    expect_no_error(check_source_compatibility(registered, test_src, "test"))
+  })
+
+  it("accepts an empty existing list (first table)", {
+    first_src <- local_data_frame_source(new_users_df(), "users")
+    expect_no_error(check_source_compatibility(list(), first_src, "users"))
+  })
+
+  it("rejects mixed source types (DataFrameSource + DBISource)", {
+    skip_if_not_installed("RSQLite")
+
+    frame_src <- local_data_frame_source(new_users_df(), "users")
+    registered <- list(users = frame_src)
+
+    # Candidate: a DBISource on an in-memory SQLite connection.
+    conn <- DBI::dbConnect(RSQLite::SQLite(), ":memory:")
+    withr::defer(DBI::dbDisconnect(conn))
+    DBI::dbWriteTable(conn, "test_table", new_test_df())
+    sqlite_src <- DBISource$new(conn, "test_table")
+    expect_error(
+      check_source_compatibility(registered, sqlite_src, "test_table")
+    )
+  })
+})
diff --git a/pkg-r/tests/testthat/test-querychat_module.R b/pkg-r/tests/testthat/test-querychat_module.R
index 99ae477f9..040db90f5 100644
--- a/pkg-r/tests/testthat/test-querychat_module.R
+++ b/pkg-r/tests/testthat/test-querychat_module.R
@@ -17,10 +17,125 @@ test_that("Shiny app example loads without errors", {
   })
 })
 
+test_that("mod_server() return includes table() and table_names() for single-table", {
+  skip_if_no_dataframe_engine()
+
+  src <- local_data_frame_source(new_test_df())
+  sources <- list(test_table = src)
+  executor <- build_query_executor(sources)
+  withr::defer(executor$cleanup())
+
+  mock_client <- function(...) structure(list(), class = "MockChat")
+
+  # Arguments forwarded to mod_server() by testServer().
+  server_args <- list(
+    id = "test",
+    data_sources = sources,
+    executor = executor,
+    greeting = "Hello",
+    client = mock_client,
+    tools = "query",
+    enable_bookmarking = FALSE
+  )
+
+  shiny::testServer(mod_server, args = server_args, {
+    # table_names_fn() lists the single registered table
+    expect_equal(table_names_fn(), "test_table")
+
+    # table_fn() hands back a TableAccessor bound to that table
+    tbl_acc <- table_fn("test_table")
+    expect_true(inherits(tbl_acc, "TableAccessor"))
+    expect_equal(tbl_acc$table_name, "test_table")
+
+    # With no filter set, TableAccessor$df() yields the full five-row frame
+    full_df <- shiny::isolate(tbl_acc$df())
+    expect_equal(nrow(full_df), 5L)
+
+    # Single-table backward compat: the first table state keeps df/sql/title
+    first_state <- tables[[1]]
+    expect_true(is.function(first_state$df))
+    expect_true(is.function(first_state$sql))
+    expect_true(is.function(first_state$title))
+
+    # The module's return value exposes table() and table_names()
+    expect_true(is.function(session$returned$table))
+    expect_true(is.function(session$returned$table_names))
+    returned_acc <- session$returned$table("test_table")
+    expect_s3_class(returned_acc, "TableAccessor")
+    expect_equal(session$returned$table_names(), "test_table")
+
+    # ...alongside the backward-compatible df/sql/title accessors
+    expect_true(is.function(session$returned$df))
+    expect_true(is.function(session$returned$sql))
+    expect_true(is.function(session$returned$title))
+  })
+})
+
+test_that("mod_server() return includes table() and table_names() for multi-table", {
+  skip_if_no_dataframe_engine()
+
+  # Two sources over the same test data, registered as tbl_a and tbl_b, so
+  # mod_server() is exercised with more than one table.
+  ds1 <- local_data_frame_source(new_test_df(), table_name = "tbl_a")
+  ds2 <- local_data_frame_source(new_test_df(), table_name = "tbl_b")
+  data_sources <- list(tbl_a = ds1, tbl_b = ds2)
+  executor <- build_query_executor(data_sources)
+  withr::defer(executor$cleanup())
+
+  # Minimal stand-in for the chat client; nothing in this test inspects how
+  # the factory was called, so no call tracking is needed.
+  client_factory <- function(...) structure(list(), class = "MockChat")
+
+  shiny::testServer(
+    mod_server,
+    args = list(
+      id = "test",
+      data_sources = data_sources,
+      executor = executor,
+      greeting = "Hello",
+      client = client_factory,
+      tools = "query",
+      enable_bookmarking = FALSE
+    ),
+    {
+      # table_names_fn() returns all registered table names
+      expect_equal(table_names_fn(), c("tbl_a", "tbl_b"))
+
+      # table_fn() returns a TableAccessor for each table
+      acc_a <- table_fn("tbl_a")
+      expect_true(inherits(acc_a, "TableAccessor"))
+      expect_equal(acc_a$table_name, "tbl_a")
+
+      acc_b <- table_fn("tbl_b")
+      expect_true(inherits(acc_b, "TableAccessor"))
+      expect_equal(acc_b$table_name, "tbl_b")
+
+      # table_fn() errors for unknown names
+      expect_error(table_fn("nonexistent"), class = "rlang_error")
+
+      # Multi-table: single_table_error functions mention qc_vals$table()
+      single_err <- single_table_error("sql")
+      expect_error(single_err(), regexp = "qc_vals\\$table")
+
+      # Verify the returned list exposes table() and table_names()
+      expect_true(is.function(session$returned$table))
+      expect_true(is.function(session$returned$table_names))
+      acc <- session$returned$table("tbl_a")
+      expect_s3_class(acc, "TableAccessor")
+      expect_equal(sort(session$returned$table_names()), c("tbl_a", "tbl_b"))
+
+      # Verify error is surfaced through the public API
+      expect_error(session$returned$table("nonexistent"), "not found")
+    }
+  )
+})
+
 test_that("mod_server() passes visualize callback and tools to client factory", {
   skip_if_no_dataframe_engine()
 
   ds <- local_data_frame_source(new_test_df())
+  executor <- build_query_executor(list(test_table = ds))
+  withr::defer(executor$cleanup())
   captured <- NULL
 
   client_factory <- function(...) {
@@ -32,7 +147,8 @@ test_that("mod_server() passes visualize callback and tools to client factory",
     mod_server,
     args = list(
       id = "test",
-      data_source = ds,
+      data_sources = list(test_table = ds),
+      executor = executor,
       greeting = "Hello",
       client = client_factory,
       tools = c("query", "visualize"),
@@ -48,6 +164,80 @@ test_that("mod_server() passes visualize callback and tools to client factory",
   )
 })
 
+test_that("mod_server() exposes current_table() starting as NULL", {
+  skip_if_no_dataframe_engine()
+
+  src <- local_data_frame_source(new_test_df())
+  sources <- list(test_table = src)
+  executor <- build_query_executor(sources)
+  withr::defer(executor$cleanup())
+
+  mock_client <- function(...) structure(list(), class = "MockChat")
+
+  server_args <- list(
+    id = "test",
+    data_sources = sources,
+    executor = executor,
+    greeting = "Hello",
+    client = mock_client,
+    tools = "query",
+    enable_bookmarking = FALSE
+  )
+
+  shiny::testServer(mod_server, args = server_args, {
+    # No dashboard callback has been invoked, so the value is still NULL.
+    expect_true(is.function(session$returned$current_table))
+    expect_null(shiny::isolate(session$returned$current_table()))
+  })
+})
+
+test_that("mod_server() current_table() updates on update_dashboard and reset_dashboard", {
+  skip_if_no_dataframe_engine()
+
+  ds1 <- local_data_frame_source(new_test_df(), table_name = "tbl_a")
+  ds2 <- local_data_frame_source(new_test_df(), table_name = "tbl_b")
+  data_sources <- list(tbl_a = ds1, tbl_b = ds2)
+  executor <- build_query_executor(data_sources)
+  withr::defer(executor$cleanup())
+  # Capture everything mod_server() hands the client factory, callbacks included.
+  captured_callbacks <- NULL
+  client_factory <- function(...) {
+    captured_callbacks <<- list(...)
+    structure(list(), class = "MockChat")
+  }
+
+  shiny::testServer(
+    mod_server,
+    args = list(
+      id = "test",
+      data_sources = data_sources,
+      executor = executor,
+      greeting = "Hello",
+      client = client_factory,
+      tools = "query",
+      enable_bookmarking = FALSE
+    ),
+    {
+      # No callback has been invoked yet, so there is no current table
+      expect_null(shiny::isolate(session$returned$current_table()))
+
+      # update_dashboard records the table it was called with
+      shiny::isolate(
+        captured_callbacks$update_dashboard(
+          query = "SELECT * FROM tbl_a",
+          title = "All of tbl_a",
+          table = "tbl_a"
+        )
+      )
+      expect_equal(shiny::isolate(session$returned$current_table()), "tbl_a")
+
+      # reset_dashboard switches it to the table being reset
+      shiny::isolate(captured_callbacks$reset_dashboard("tbl_b"))
+      expect_equal(shiny::isolate(session$returned$current_table()), "tbl_b")
+    }
+  )
+})
+
 test_that("mod_ui() passes allow_attachments = TRUE to shinychat by default", {
   captured <- NULL
   local_mocked_bindings(
@@ -78,6 +268,8 @@ test_that("restored viz widgets survive a second bookmark cycle", {
   skip_if_no_dataframe_engine()
 
   ds <- local_data_frame_source(new_test_df())
+  executor <- build_query_executor(list(test_table = ds))
+  withr::defer(executor$cleanup())
   callbacks <- NULL
   bookmark_fn <- NULL
   restore_fn <- NULL
@@ -89,7 +281,7 @@ test_that("restored viz widgets survive a second bookmark cycle", {
   }
 
   local_mocked_bindings(
-    chat_restore = function(id, chat, session) {},
+    chat_restore = function(id, chat, ..., session) {},
     .package = "shinychat"
   )
   local_mocked_bindings(
@@ -102,9 +294,9 @@ test_that("restored viz widgets survive a second bookmark cycle", {
     .package = "shiny"
   )
   local_mocked_bindings(
-    restore_viz_widgets = function(data_source, saved_widgets, session) {
+    restore_viz_widgets = function(executor, saved_widgets, session) {
       restored_args <<- list(
-        data_source = data_source,
+        executor = executor,
         saved_widgets = saved_widgets,
         session = session
       )
@@ -117,7 +309,8 @@ test_that("restored viz widgets survive a second bookmark cycle", {
     mod_server,
     args = list(
       id = "test",
-      data_source = ds,
+      data_sources = list(test_table = ds),
+      executor = executor,
       greeting = "Hello",
       client = client_factory,
       tools = c("query", "visualize"),
@@ -145,7 +338,7 @@ test_that("restored viz widgets survive a second bookmark cycle", {
       restore_state <- new.env(parent = emptyenv())
       restore_state$values <- first_state$values
       shiny::isolate(restore_fn(restore_state))
-      expect_identical(restored_args$data_source, ds)
+      expect_true(inherits(restored_args$executor, "QueryExecutor"))
       expect_equal(restored_args$saved_widgets, saved)
 
       second_state <- new.env(parent = emptyenv())
diff --git a/pkg-r/tests/testthat/test-querychat_tools.R b/pkg-r/tests/testthat/test-querychat_tools.R
index 46bb2b22d..893c08dac 100644
--- a/pkg-r/tests/testthat/test-querychat_tools.R
+++ b/pkg-r/tests/testthat/test-querychat_tools.R
@@ -1,22 +1,35 @@
-test_that("tool_update_dashboard() checks inputs", {
-  skip_if_no_dataframe_engine()
+local_executor <- function(df_source, env = parent.frame()) {
+  qe <- build_query_executor(list(test_table = df_source)) # sole table
+  withr::defer(qe$cleanup(), envir = env) # runs when `env` exits
+  qe
+}
 
-  expect_snapshot(error = TRUE, tool_update_dashboard("foo"))
+test_that("tool_update_dashboard() checks update_fn inputs", {
+  skip_if_no_dataframe_engine()
 
   df_source <- local_data_frame_source(new_test_df())
+  executor <- local_executor(df_source)
+
   expect_snapshot(error = TRUE, {
-    tool_update_dashboard(df_source, update_fn = NULL)
-    tool_update_dashboard(df_source, update_fn = function(query) {})
-    tool_update_dashboard(df_source, update_fn = function(title, extra) {})
+    tool_update_dashboard(executor, "test_table", update_fn = NULL)
+    tool_update_dashboard(
+      executor,
+      "test_table",
+      update_fn = function(query) {}
+    )
+    tool_update_dashboard(
+      executor,
+      "test_table",
+      update_fn = function(title, extra) {}
+    )
   })
 })
 
 test_that("tool_reset_dashboard() checks inputs", {
-  expect_snapshot(error = TRUE, tool_reset_dashboard("not_a_function"))
-})
-
-test_that("tool_query() checks inputs", {
-  expect_snapshot(error = TRUE, tool_query("invalid_source"))
+  expect_snapshot(
+    error = TRUE,
+    tool_reset_dashboard("not_a_function", table_names = "t")
+  )
 })
 
 describe("querychat_tool_starts_open()", {
@@ -94,9 +107,10 @@ describe("querychat_tool_result()", {
 
   it("returns successful result for valid query action", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table WHERE id = 1",
       action = "query"
     )
@@ -109,12 +123,14 @@ describe("querychat_tool_result()", {
 
   it("returns successful result for valid update action", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table WHERE value > 20",
       title = "High values",
-      action = "update"
+      action = "update",
+      table_name = "test_table"
     )
 
     expect_s7_class(result, ellmer::ContentToolResult)
@@ -127,9 +143,10 @@ describe("querychat_tool_result()", {
 
   it("returns successful result for reset action", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = NULL,
       action = "reset"
     )
@@ -141,9 +158,10 @@ describe("querychat_tool_result()", {
 
   it("handles query errors appropriately", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM nonexistent_table",
       action = "query"
     )
@@ -155,11 +173,13 @@ describe("querychat_tool_result()", {
 
   it("handles update errors appropriately", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "INVALID SQL",
-      action = "update"
+      action = "update",
+      table_name = "test_table"
     )
 
     expect_s7_class(result, ellmer::ContentToolResult)
@@ -169,9 +189,10 @@ describe("querychat_tool_result()", {
 
   it("formats query results with details block", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table LIMIT 1",
       action = "query"
     )
@@ -185,12 +206,14 @@ describe("querychat_tool_result()", {
 
   it("formats update results with button HTML", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table",
       title = "Test Filter",
-      action = "update"
+      action = "update",
+      table_name = "test_table"
     )
 
     markdown <- result@extra$display$markdown
@@ -204,9 +227,10 @@ describe("querychat_tool_result()", {
 
   it("formats reset results with button HTML", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = NULL,
       action = "reset"
     )
@@ -218,12 +242,14 @@ describe("querychat_tool_result()", {
 
   it("includes title in extra display metadata for update action", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table",
       title = "Custom Title",
-      action = "update"
+      action = "update",
+      table_name = "test_table"
     )
 
     expect_equal(result@extra$display$title, "Custom Title")
@@ -231,9 +257,10 @@ describe("querychat_tool_result()", {
 
   it("does not include title for query action", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table",
       title = "Should be ignored",
       action = "query"
@@ -244,17 +271,18 @@ describe("querychat_tool_result()", {
 
   it("sets open state based on action and tool details option", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
     withr::local_options(querychat.tool_details = NULL)
 
     query_result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table",
       action = "query"
     )
     expect_false(query_result@extra$display$open)
 
     reset_result <- querychat_tool_result(
-      df_source,
+      executor,
       query = NULL,
       action = "reset"
     )
@@ -263,9 +291,10 @@ describe("querychat_tool_result()", {
 
   it("shows request on error", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "INVALID SQL",
       action = "query"
     )
@@ -275,9 +304,10 @@ describe("querychat_tool_result()", {
 
   it("hides request on success", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     result <- querychat_tool_result(
-      df_source,
+      executor,
       query = "SELECT * FROM test_table",
       action = "query"
     )
@@ -291,7 +321,8 @@ describe("tool_query()", {
 
   it("returns an ellmer tool object", {
     df_source <- local_data_frame_source(new_test_df())
-    tool <- tool_query(df_source)
+    executor <- local_executor(df_source)
+    tool <- tool_query(executor)
 
     expect_s3_class(tool, "ellmer::ToolDef")
     expect_equal(tool@name, "querychat_query")
@@ -299,7 +330,8 @@ describe("tool_query()", {
 
   it("includes database type in description", {
     df_source <- local_data_frame_source(new_test_df())
-    tool <- tool_query(df_source)
+    executor <- local_executor(df_source)
+    tool <- tool_query(executor)
 
     # DataFrameSource uses DuckDB
     expect_match(tool@description, "DuckDB|duckdb", ignore.case = TRUE)
@@ -307,7 +339,8 @@ describe("tool_query()", {
 
   it("creates a working tool function", {
     df_source <- local_data_frame_source(new_test_df())
-    tool <- tool_query(df_source)
+    executor <- local_executor(df_source)
+    tool <- tool_query(executor)
 
     # Execute the tool function
     result <- tool(query = "SELECT * FROM test_table LIMIT 1")
@@ -322,8 +355,13 @@ describe("tool_update_dashboard()", {
 
   it("returns an ellmer tool object", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
-    tool <- tool_update_dashboard(df_source)
+    tool <- tool_update_dashboard(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {}
+    )
 
     expect_s3_class(tool, "ellmer::ToolDef")
     expect_equal(tool@name, "querychat_update_dashboard")
@@ -331,8 +369,13 @@ describe("tool_update_dashboard()", {
 
   it("includes database type in description", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
-    tool <- tool_update_dashboard(df_source)
+    tool <- tool_update_dashboard(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {}
+    )
 
     # DataFrameSource uses DuckDB
     expect_match(tool@description, "DuckDB|duckdb", ignore.case = TRUE)
@@ -340,40 +383,47 @@ describe("tool_update_dashboard()", {
 
   it("creates a working tool function", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     res_update <- NULL
-    tool <- tool_update_dashboard(df_source, function(query, title) {
-      res_update <<- list(query = query, title = title)
-    })
+    tool <- tool_update_dashboard(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {
+        res_update <<- list(query = query, title = title, table = table)
+      }
+    )
 
     res_tool <- tool(
       query = "SELECT * FROM test_table WHERE id > 2",
-      title = "Filtered View"
+      title = "Filtered View",
+      table = "test_table"
     )
 
     expect_s7_class(res_tool, ellmer::ContentToolResult)
     expect_equal(res_update$query, "SELECT * FROM test_table WHERE id > 2")
     expect_equal(res_update$title, "Filtered View")
+    expect_equal(res_update$table, "test_table")
   })
 })
 
 describe("tool_reset_dashboard()", {
-  reset_fn <- function() {
-    "Reset executed"
-  }
-
   it("returns an ellmer tool object", {
-    tool <- tool_reset_dashboard(reset_fn)
+    tool <- tool_reset_dashboard(
+      reset_fn = function(table) {},
+      table_names = c("test_table")
+    )
 
     expect_s3_class(tool, "ellmer::ToolDef")
     expect_equal(tool@name, "querychat_reset_dashboard")
   })
 
   it("uses the provided reset function", {
-    tool <- tool_reset_dashboard(reset_fn)
+    reset_fn <- function(table) paste("Reset executed for", table)
+    tool <- tool_reset_dashboard(reset_fn, table_names = c("test_table"))
 
     expect_s3_class(tool, "ellmer::ToolDef")
-    expect_equal(tool(), "Reset executed")
+    expect_equal(tool("test_table"), "Reset executed for test_table")
   })
 })
 
@@ -382,43 +432,59 @@ describe("tool_update_dashboard_impl()", {
 
   it("returns a function", {
     df_source <- local_data_frame_source(new_test_df())
-    current_query <- shiny::reactiveVal("SELECT * FROM test_table")
-    current_title <- shiny::reactiveVal("All Data")
+    executor <- local_executor(df_source)
 
-    impl_fn <- tool_update_dashboard_impl(df_source)
+    impl_fn <- tool_update_dashboard_impl(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {}
+    )
 
     expect_type(impl_fn, "closure")
   })
 
   it("updates reactive values on successful query", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     res_update <- NULL
-    impl_fn <- tool_update_dashboard_impl(df_source, function(query, title) {
-      res_update <<- list(query = query, title = title)
-    })
+    impl_fn <- tool_update_dashboard_impl(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {
+        res_update <<- list(query = query, title = title, table = table)
+      }
+    )
 
     res_tool <- impl_fn(
       query = "SELECT * FROM test_table WHERE id < 3",
-      title = "First Two"
+      title = "First Two",
+      table = "test_table"
     )
 
     expect_equal(res_update$query, "SELECT * FROM test_table WHERE id < 3")
     expect_equal(res_update$title, "First Two")
+    expect_equal(res_update$table, "test_table")
     expect_null(res_tool@error)
   })
 
   it("does not update reactive values on query error", {
     df_source <- local_data_frame_source(new_test_df())
+    executor <- local_executor(df_source)
 
     res_update <- NULL
-    impl_fn <- tool_update_dashboard_impl(df_source, function(query, title) {
-      res_update <<- list(query = query, title = title)
-    })
+    impl_fn <- tool_update_dashboard_impl(
+      executor,
+      table_names = "test_table",
+      update_fn = function(query, title, table) {
+        res_update <<- list(query = query, title = title, table = table)
+      }
+    )
 
     res_tool <- impl_fn(
       query = "INVALID SQL",
-      title = "Should Not Update"
+      title = "Should Not Update",
+      table = "test_table"
     )
 
     # `update_fn` was not called
@@ -427,3 +493,39 @@ describe("tool_update_dashboard_impl()", {
     expect_s3_class(res_tool@error, class = "error")
   })
 })
+
+describe("get_schema_result_display()", {
+  it("returns a sentinel span with data-table attribute", {
+    result <- GetSchemaResult(
+      value = "Table: orders\nColumns:\n- id (INTEGER)",
+      table_name = "orders"
+    )
+    html_str <- as.character(get_schema_result_display(result))
+    # expect_match() reports the rendered HTML on failure, whereas
+    # expect_true(grepl(...)) can only report that the result was FALSE.
+    expect_match(html_str, "qc-schema-collector", fixed = TRUE)
+    expect_match(html_str, 'data-table="orders"', fixed = TRUE)
+    # Accepts both "display:none" and "display: none".
+    expect_match(html_str, "display: ?none")
+  })
+
+  it("embeds schema text in data-schema attribute", {
+    schema <- "Table: orders\nColumns:\n- id (INTEGER)"
+    result <- GetSchemaResult(value = schema, table_name = "orders")
+    html_str <- as.character(get_schema_result_display(result))
+    # NOTE(review): "orders" is also the data-table value, so this is a loose check.
+    expect_match(html_str, "data-schema", fixed = TRUE)
+    expect_match(html_str, "orders", fixed = TRUE)
+  })
+
+  it("includes querychat-schema-display HTML dependency", {
+    result <- GetSchemaResult(
+      value = "Table: t\nColumns:\n- x (TEXT)",
+      table_name = "t"
+    )
+    html <- get_schema_result_display(result)
+    deps <- htmltools::findDependencies(html)
+    dep_names <- vapply(deps, function(d) d$name, character(1))
+    expect_true("querychat-schema-display" %in% dep_names)
+  })
+})
diff --git a/pkg-r/tests/testthat/test-viz-tool.R b/pkg-r/tests/testthat/test-viz-tool.R
index ed5104541..89964ff0c 100644
--- a/pkg-r/tests/testthat/test-viz-tool.R
+++ b/pkg-r/tests/testthat/test-viz-tool.R
@@ -134,10 +134,12 @@ describe("tool_visualize_dashboard()", {
         callback_data <<- data
       }
     )
-    suppressWarnings(tool(
-      ggsql = "SELECT * FROM test_table VISUALISE value AS x DRAW histogram",
-      title = "Test"
-    ))
+    suppressWarnings(
+      tool(
+        ggsql = "SELECT * FROM test_table VISUALISE value AS x DRAW histogram",
+        title = "Test"
+      )
+    )
     expect_type(callback_data, "list")
     expect_true(all(c("ggsql", "title", "widget_id") %in% names(callback_data)))
     expect_identical(footer_data$dom_widget_id, footer_data[[3]])
@@ -365,10 +367,12 @@ describe("tool_visualize_dashboard()", {
       update_fn = function(data) {}
     )
 
-    suppressWarnings(tool(
-      ggsql = "SELECT * FROM test_table VISUALISE value AS x DRAW histogram",
-      title = "Test"
-    ))
+    suppressWarnings(
+      tool(
+        ggsql = "SELECT * FROM test_table VISUALISE value AS x DRAW histogram",
+        title = "Test"
+      )
+    )
 
     expect_identical(
       footer_data$dom_widget_id,
diff --git a/pkg-r/vignettes/build.Rmd b/pkg-r/vignettes/build.Rmd
index 860cea0f7..54ed3f5fa 100644
--- a/pkg-r/vignettes/build.Rmd
+++ b/pkg-r/vignettes/build.Rmd
@@ -15,23 +15,16 @@ knitr::opts_chunk$set(
 )
 ```
 
-While `querychat_app()` provides a quick way to start exploring data, building bespoke Shiny apps with querychat unlocks the full power of integrating natural language data exploration with custom visualizations, layouts, and interactivity. This guide shows you how to integrate querychat into your own Shiny applications and leverage its reactive data outputs to create rich, interactive dashboards.
+While `querychat_app()` provides a quick way to start exploring data, building bespoke Shiny apps with querychat unlocks the full power of integrating natural language data exploration with custom visualizations, layouts, and interactivity. This guide shows you how to integrate querychat into your own Shiny applications and leverage its reactive data outputs to create rich, interactive experiences.
 
-querychat is a particularly good fit for Shiny apps that have:
-
-1. **A single data source** (or a set of related tables that can be joined)
-2. **Multiple filters** that let users slice and explore the data in different ways
-3. **Several visualizations and outputs** that all depend on the same filtered data
-
-In these apps, querychat can replace or augment your filtering UI by allowing users to describe what they want to see in natural language. Instead of building complex filter controls, users can simply ask questions like "show me customers from California who spent over $1000 last quarter" and querychat will generate the appropriate SQL query.
+querychat lets users ask questions of their data in plain language — filtering, sorting, summarizing, joining across tables, and creating visualizations — all without needing to write SQL or navigate complex filter UIs. You can use it as the primary exploration interface in a standalone app, or embed it alongside curated views in an existing dashboard to let users go deeper than the views you designed.
 
 This is especially valuable when:
 
 - Your data has many columns and building a UI for all possible filters would be overwhelming
 - Users want to explore ad-hoc combinations of filters that you didn't anticipate
-- You want to make data exploration more accessible to users who aren't comfortable with traditional filtering UIs
-
-If you have an existing app with a reactive data frame that flows through multiple outputs, querychat can be a natural addition to provide an alternative way to filter that data.
+- You have multiple related tables that users may want to query and join
+- You want to make data exploration more accessible to non-technical users
 
 
 ## Starter template
@@ -419,18 +412,75 @@ This is equivalent to the user asking the LLM to "reset" or "show all data".
 
 ## Multiple tables
 
-Currently, you have two options for exploring multiple tables in querychat:
+querychat can work with multiple related tables in a single chat interface, letting users query across tables, join data, and filter any table independently. Register additional tables with `$add_table()` after creating the `QueryChat` instance, then access per-table state through the `$table()` method.
 
-1. Join the tables into a single table before passing to querychat
-2. Use multiple querychat instances in the same app
+### Registering tables
 
-The first option makes it possible to chat with multiple tables inside a single chat interface, whereas the second option requires a separate chat interface for each table.
+Pass the first table when creating `QueryChat`, then call `$add_table()` for each additional table:
 
-::: {.alert .alert-info}
-### Multiple filtered tables
+```{r}
+library(querychat)
 
-We do intend on supporting multiple filtered tables in a future release -- if you're interested in this feature, please upvote [the relevant issue](https://github.com/posit-dev/querychat/issues/6)
-:::
+qc <- QueryChat$new(orders, "orders")
+qc$add_table(customers, "customers")
+qc$add_table(products, "products")
+```
+
+The LLM can query any registered table and write joins across them. You can inspect which tables are registered with `qc$table_names()`.
+
+### Per-table reactive access
+
+When working with multiple tables, access filtered data and SQL for each table individually using `$table()`:
+
+```{r}
+server <- function(input, output, session) {
+  qc_vals <- qc$server()
+
+  output$orders_table <- renderDataTable({
+    qc_vals$table("orders")$df()
+  })
+
+  output$orders_sql <- renderText({
+    qc_vals$table("orders")$sql()
+  })
+
+  output$customers_table <- renderDataTable({
+    qc_vals$table("customers")$df()
+  })
+}
+```
+
+Each table has its own `$df()`, `$sql()`, and `$title()` reactives that update independently when the user filters that specific table.
+
+### Tracking the active table
+
+Use `$current_table()` to find out which table the LLM most recently queried. This is useful for auto-switching a tabbed UI to the relevant table:
+
+```{r}
+observe({
+  tbl <- qc_vals$current_table()
+  req(tbl)
+  nav_select("table_tabs", selected = tbl)
+})
+```
+
+### Data dictionary
+
+When working with multiple related tables, providing a [data dictionary](context.html#data-dictionary) is strongly recommended. It tells the LLM how tables relate to each other, which columns are keys, and what domain terms mean — all of which help it write accurate joins and queries.
+
+```{r}
+qc <- QueryChat$new(
+  orders, "orders",
+  data_dict = "data-dict.yaml"
+)
+qc$add_table(customers, "customers")
+```
+
+See [Provide context](context.html#data-dictionary) for the full data dictionary format.
+
+### Separate chat interfaces
+
+If your tables are truly independent (not related), you may prefer separate `QueryChat` instances, each with its own chat interface:
 
 <details>
 <summary> <code>app.R </code> </summary>
diff --git a/pkg-r/vignettes/context.Rmd b/pkg-r/vignettes/context.Rmd
index aac5efe8b..e66413cf5 100644
--- a/pkg-r/vignettes/context.Rmd
+++ b/pkg-r/vignettes/context.Rmd
@@ -15,70 +15,135 @@ knitr::opts_chunk$set(
 )
 ```
 
-querychat automatically gathers information about your table to help the LLM write accurate SQL queries. This includes column names and types, numerical ranges, and categorical value examples. (All of this information is provided to the LLM as part of the **system prompt** -- a string of text containing instructions and context for the LLM to consider when responding to user queries.)
+querychat automatically gathers schema information about your tables — column names, types, numerical ranges, and categorical values — and makes it available to the LLM on demand via the `querychat_get_schema` [tool](tools.html#schema-retrieval). The LLM calls this tool before writing SQL to understand the structure of the tables it's querying.
 
 Importantly, we are **not** sending your raw data to the LLM and asking it to do complicated math. The LLM only needs to understand the structure and schema of your data in order to write SQL queries.
 
-You can get even better results by customizing the system prompt in three ways:
+You can get even better results by providing additional context:
 
-1. Add a [data description](#data-description) to provide more context about what the data represents
-2. Add [custom instructions](#extra-instructions) to guide the LLM's behavior
-3. Use a fully [custom prompt template](#custom-template) if you want complete control (useful if you want to be certain the model cannot see any literal values from your data)
+1. Add a [data dictionary](#data-dictionary) to describe tables, columns, relationships, and domain terminology (recommended)
+2. Add a [data description](#data-description) for a simpler alternative when working with a single, straightforward table
+3. Add [custom instructions](#extra-instructions) to guide the LLM's behavior
+4. Use a fully [custom prompt template](#custom-template) if you want complete control
 
 ```{r}
 library(querychat)
 library(palmerpenguins)
 ```
 
-## Default prompt
+## Data dictionary {#data-dictionary}
 
-For full visibility into the system prompt that querychat generates for the LLM, you can inspect the `system_prompt` field. This is useful for debugging and understanding exactly what context the LLM is using:
+A **data dictionary** is a YAML file that describes your tables, columns, relationships, and domain-specific terminology. It's the recommended way to provide context, especially when working with [multiple tables](build.html#multiple-tables) or when your data has domain-specific meaning that isn't obvious from column names alone.
 
 ```{r}
-qc <- querychat(penguins)
-cat(qc$system_prompt)
+qc <- QueryChat$new(
+  orders, "orders",
+  data_dict = "data-dict.yaml"
+)
+qc$add_table(customers, "customers")
 ```
 
-By default, the system prompt contains the following components:
+### Format
+
+A data dictionary has three top-level sections — `tables`, `relationships`, and `glossary` — alongside a top-level `version` field.
+
+```yaml
+# data-dict.yaml
+version: "0.2.0"
+
+tables:
+  orders:
+    description: One row per customer order.
+    columns:
+      - name: order_id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique order identifier.
+      - name: customer_id
+        type: number(id)
+        constraints: [foreign_key]
+        description: References customers.id.
+      - name: total
+        type: number(quantity)
+        description: Order total in USD.
+      - name: status
+        type: enum
+        values: [pending, shipped, delivered, cancelled]
+        description: Current order status.
+
+  customers:
+    description: One row per customer.
+    columns:
+      - name: id
+        type: number(id)
+        constraints: [primary_key]
+        description: Unique customer identifier.
+      - name: name
+        type: string
+        description: Full name.
+      - name: region
+        type: string
+        description: Geographic sales region.
+
+relationships:
+  - description: Each order belongs to one customer.
+    cardinality: many-to-one
+    join: orders.customer_id = customers.id
+
+glossary:
+  AOV: Average order value — total revenue divided by number of orders.
+  churn: A customer who has not placed an order in the last 90 days.
+```
+
+#### Tables
+
+Each entry under `tables` describes one table. The key must match the table name you pass to `QueryChat$new()` or `$add_table()`.
+
+- **`description`**: What this table represents (one sentence is usually enough).
+- **`columns`**: A list of column annotations. Each column can have:
+  - `name`: Column name (must match the actual column)
+  - `type`: Semantic type hint — `string`, `number`, `number(id)`, `number(quantity)`, `date`, `enum`
+  - `constraints`: Optional list — `primary_key`, `foreign_key`
+  - `description`: What this column means in plain English
+  - `values`: For `enum` columns, the list of possible values
+
+Columns listed in the data dictionary are excluded from the auto-generated schema (since your description supersedes the auto-detected metadata). Columns not listed are still auto-detected as usual.
+
+#### Relationships
+
+The `relationships` section tells the LLM how to join tables. Each entry has:
+
+- `description`: A plain-English description of the relationship
+- `cardinality`: `one-to-one`, `one-to-many`, or `many-to-one`
+- `join`: The join condition (e.g., `orders.customer_id = customers.id`)
+
+#### Glossary
+
+The `glossary` section defines domain-specific terms that users might use in their questions. This helps the LLM translate business language into correct SQL.
 
-1. The basic set of behaviors and guidelines the LLM must follow in order for querychat to work properly, including how to use [tools](tools.html) to execute queries and update the app.
-2. The SQL schema of the data frame you provided. This includes:
-    - Column names
-    - Data types (integer, real, boolean, date/datetime, text)
-    - For text columns with less than 10 unique values, we assume they are categorical variables and include the list of values
-    - For integer and real columns, we include the range
-3. A [data description](#data-description) (if provided via `data_description`)
-4. [Additional instructions](#additional-instructions) you want to use to guide querychat's behavior (if provided via `extra_instructions`).
 
 ## Data description {#data-description}
 
-If your column names are descriptive, querychat may already work well without additional context. However, if your columns are named `x`, `V1`, `value`, etc., you should provide a data description. Use the `data_description` parameter for this:
+For simple single-table use cases where a full data dictionary would be overkill, you can provide a **data description** — a free-form Markdown file or string that describes what the data represents. Use the `data_description` parameter:
 
 ```{r}
-qc <- querychat(
+qc <- QueryChat$new(
   penguins,
   data_description = "data_description.md"
 )
-
-cat(qc$system_prompt)
 ```
 
-querychat doesn't need this information in any particular format -- just provide what a human would find helpful:
+querychat doesn't need this in any particular format — just provide what a human would find helpful:
 
 ```markdown
 <!-- data_description.md -->
 
-This dataset contains information about Palmer Archipelago penguins,
-collected for studying penguin populations.
+This dataset contains information about Palmer Archipelago penguins.
 
 - species: Penguin species (Adelie, Chinstrap, Gentoo)
 - island: Island where observed (Torgersen, Biscoe, Dream)
 - bill_length_mm: Bill length in millimeters
-- bill_depth_mm: Bill depth in millimeters
-- flipper_length_mm: Flipper length in millimeters
 - body_mass_g: Body mass in grams
-- sex: Penguin sex (male, female)
-- year: Year of observation
 ```
 
 ## Additional instructions {#extra-instructions}
@@ -86,12 +151,10 @@ collected for studying penguin populations.
 You can add custom instructions to guide the LLM's behavior using the `extra_instructions` parameter:
 
 ```{r}
-qc <- querychat(
+qc <- QueryChat$new(
   penguins,
   extra_instructions = "instructions.md"
 )
-
-cat(qc$system_prompt)
 ```
 
 Or as a string:
@@ -99,22 +162,29 @@ Or as a string:
 ```{r}
 instructions <- "
 - Use British spelling conventions
-- Stay on topic and only discuss the data dashboard
+- Stay on topic and only discuss the data
 - Refuse to answer unrelated questions
 "
 
-qc <- querychat(
+qc <- QueryChat$new(
   penguins,
   extra_instructions = instructions
 )
-
-cat(qc$system_prompt)
 ```
 
 ::: {.alert .alert-warning}
 LLMs may not always follow your instructions perfectly. Test extensively when changing instructions or models.
 :::
 
+## Default prompt
+
+For full visibility into the system prompt that querychat generates for the LLM, you can inspect the `system_prompt` field. This is useful for debugging and understanding exactly what context the LLM is working with:
+
+```{r}
+qc <- QueryChat$new(penguins)
+cat(qc$system_prompt)
+```
+
 ## Custom template {#custom-template}
 
 If you want more control over the system prompt, you can provide a custom prompt template using the `prompt_template` parameter. This is for more advanced users who want to fully customize the LLM's behavior. See the [QueryChat reference](../reference/QueryChat.html) for details on the available template variables.
diff --git a/pkg-r/vignettes/tools.Rmd b/pkg-r/vignettes/tools.Rmd
index 373bac17c..c1a735aa3 100644
--- a/pkg-r/vignettes/tools.Rmd
+++ b/pkg-r/vignettes/tools.Rmd
@@ -19,17 +19,26 @@ querychat combines [tool calling](https://ellmer.tidyverse.org/articles/tool-cal
 
 One important thing to understand generally about querychat's tools is they are R functions, and that execution happens on _your machine_, not on the LLM provider's side. In other words, the SQL queries generated by the LLM are executed locally in the R process running the app.
 
-querychat provides the LLM access to three tool groups:
+querychat provides the LLM access to four tool groups:
 
-1. **Data updating** - Filter and sort data (without sending results to the LLM).
-2. **Data analysis** - Calculate summaries and return results for interpretation by the LLM.
-3. **Data visualization** - Create charts inline in the chat.
+1. **Schema retrieval** - Fetch table structure before writing SQL.
+2. **Data updating** - Filter and sort data (without sending results to the LLM).
+3. **Data analysis** - Calculate summaries and return results for interpretation by the LLM.
+4. **Data visualization** - Create charts inline in the chat.
 
 ```{r}
 library(querychat)
 library(palmerpenguins)
 ```
 
+## Schema retrieval {#schema-retrieval}
+
+Before writing any SQL query, the LLM calls the `querychat_get_schema` tool to retrieve column names, types, value ranges, and descriptions for a specific table. This on-demand approach means the LLM only fetches schema for the tables it actually needs, keeping the system prompt lean and startup fast — especially when working with [multiple tables](build.html#multiple-tables) or large databases.
+
+If you've provided a [data dictionary](context.html#data-dictionary), the schema response includes your column descriptions and relationship information. Columns annotated in the data dictionary are excluded from the auto-generated schema metadata (since your description supersedes it).
+
+This tool is always registered and cannot be disabled.
+
 ## Data updating {#data-updating}
 
 When a user asks to "Show me..." or "Filter to..." or "Sort by...", the LLM requests a call to the `update_dashboard` tool with an appropriate SQL query as input. An important constraint is that the query must return all original schema columns (typically using `SELECT *`). When called, querychat will both set a reactive value holding [the current SQL query](build.html#sql-query) and execute the query to get the result. The result of query then used to set a reactive value holding the [filtered/sorted data frame](build.html#filtered-data). Thanks to reactivity, this will automatically update any views depending on this data frame, such as the data table displayed in the UI.
@@ -71,7 +80,7 @@ This tool:
 2. Renders the `VISUALISE` clause as an interactive chart
 3. Displays the chart inline in the chat
 
-Unlike the data updating tools, visualization queries don't affect the dashboard filter.
+Unlike the data updating tools, visualization queries don't affect the active data filter.
 They query the full dataset independently, and each call produces a new inline chart message in the chat.
 
 The inline chart includes controls for fullscreen viewing, saving as PNG/SVG, and a "Show Query" toggle that reveals the underlying ggsql code.
@@ -107,6 +116,7 @@ If you'd like to better understand how the tools work and how the LLM is prompte
 
 **Prompts:**
 
+- [`prompts/tool-get-schema.md`](https://github.com/posit-dev/querychat/blob/main/pkg-r/inst/prompts/tool-get-schema.md)
 - [`prompts/tool-update-dashboard.md`](https://github.com/posit-dev/querychat/blob/main/pkg-r/inst/prompts/tool-update-dashboard.md)
 - [`prompts/tool-reset-dashboard.md`](https://github.com/posit-dev/querychat/blob/main/pkg-r/inst/prompts/tool-reset-dashboard.md)
 - [`prompts/tool-query.md`](https://github.com/posit-dev/querychat/blob/main/pkg-r/inst/prompts/tool-query.md)
diff --git a/pyproject.toml b/pyproject.toml
index 373c9804d..bec6902f5 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -29,6 +29,7 @@ dependencies = [
     "chevron",
     "sqlalchemy>=2.0.0", # Using 2.0+ for improved type hints and API
     "great-tables>=0.16.0",
+    "pyyaml",
 ]
 classifiers = [
     "Programming Language :: Python",