diff --git a/.github/workflows/tests.yml b/.github/workflows/tests.yml index 70c76d2..70fdff5 100644 --- a/.github/workflows/tests.yml +++ b/.github/workflows/tests.yml @@ -38,6 +38,8 @@ jobs: run: uv sync --all-extras --dev - name: Run tests + # Smoke CLI tests intentionally disable subprocess coverage collection + # to avoid runner-specific flakiness while keeping parent-process coverage strict. run: uv run pytest --cov=codeclone --cov-report=term-missing --cov-fail-under=98 - name: Verify baseline exists @@ -46,7 +48,7 @@ jobs: - name: Check for new clones vs baseline if: ${{ matrix.python-version == '3.13' }} - run: uv run codeclone . --fail-on-new --no-progress + run: uv run codeclone . --ci lint: runs-on: ubuntu-latest diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 8b0f864..8609d0a 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,9 +1,31 @@ repos: -- repo: local + - repo: local hooks: - - id: codeclone + - id: ruff-check + name: Ruff (lint) + entry: ruff check . + language: system + pass_filenames: false + types: [ python ] + + - id: ruff-format + name: Ruff (format) + entry: ruff format . + language: system + pass_filenames: false + types: [ python ] + + - id: mypy + name: Mypy + entry: mypy . + language: system + pass_filenames: false + types: [ python ] + + - id: codeclone name: CodeClone entry: codeclone - language: python - args: [".", "--fail-on-new"] - types: [python] + language: system + pass_filenames: false + args: [ ".", "--ci" ] + types: [ python ] \ No newline at end of file diff --git a/CHANGELOG.md b/CHANGELOG.md index e86fef2..48213a3 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,5 +1,79 @@ # Changelog +## [1.3.0] - 2026-02-08 + +### Overview + +This release improves detection precision, determinism, and auditability, adds +segment-level reporting, refreshes the HTML report UI, and hardens baseline/cache +contracts for CI usage. + +**Breaking (CI):** baseline contract checks are stricter. Legacy or mismatched baselines +must be regenerated. + +### Detection Engine + +- Safe normalization upgrades: local logical equivalence, proven-domain commutative + canonicalization, and preserved symbolic call targets. +- Internal CFG metadata markers were moved to the `__CC_META__::...` namespace and emitted + as synthetic AST names to prevent collisions with user string literals. +- CFG precision upgrades: short-circuit micro-CFG, selective `try/except` raise-linking, + loop `break`/`continue` jump semantics, `for/while ... else`, and ordered `match`/`except`. +- Deterministic traversal and ordering improvements for stable clone grouping/report output. +- Segment-level internal detection added with strict candidate->hash confirmation; remains + report-only (not part of baseline/CI fail criteria). +- Segment report noise reduction: overlapping windows are merged and boilerplate-only groups + are suppressed using deterministic AST criteria. + +### Baseline & CI + +- Baseline format is versioned (`baseline_version`, `schema_version`) and legacy baselines + fail fast with regeneration guidance. +- Added tamper-evident baseline integrity for v1.3+ (`generator`, `payload_sha256`). +- Added configurable size guards: `--max-baseline-size-mb`, `--max-cache-size-mb`. +- Behavioral hardening: in normal mode, untrusted baseline states are ignored with warning + and compared as empty; in `--fail-on-new` / `--ci`, they fail fast with deterministic exit codes. + +Update baseline after upgrade: + +```bash +codeclone . 
--update-baseline +``` + +### CLI & Reports + +- Added `--version`, `--cache-path` (legacy alias: `--cache-dir`), and `--ci` preset. +- Added strict output extension validation for `--html/.html`, `--json/.json`, `--text/.txt`. +- Summary output was redesigned for deterministic, cache-aware metrics across standard and CI modes. +- User-facing CLI messages were centralized in `codeclone/ui_messages.py`. +- HTML/TXT/JSON reports now include consistent provenance metadata (baseline/cache status fields). +- Clone group/report ordering is deterministic and aligned across HTML/TXT/JSON outputs. + +### HTML UI + +- Refreshed layout with improved navigation and dashboard widgets. +- Added command palette and keyboard shortcuts. +- Replaced emoji icons with inline SVG icons. +- Hardened escaping (text + attribute context) and snippet fallback behavior. + +### Cache & Security + +- Cache default moved to `/.cache/codeclone/cache.json` with legacy path warning. +- Cache schema was extended to include segment data (`CACHE_VERSION=1.1`). +- Cache integrity uses constant-time signature checks and deep schema validation. +- Invalid/oversized cache is ignored deterministically and rebuilt from source. +- Added security regressions for traversal safety, report escaping, baseline/cache integrity, + and deterministic report ordering across formats. +- Fixed POSIX parser CPU guard to avoid lowering `RLIMIT_CPU` hard limit. + +### Documentation & Packaging + +- Updated README and docs (`architecture`, `cfg`, `SECURITY`, `CONTRIBUTING`) to reflect + current contracts and behaviors. +- Removed an invalid PyPI classifier from package metadata. + +--- + ## [1.2.1] - 2026-02-02 ### Overview diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index 7987e01..47ccfdf 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -30,6 +30,7 @@ We especially welcome contributions in the following areas: - Control Flow Graph (CFG) construction and semantics - AST normalization improvements +- Segment-level clone detection and reporting - False-positive reduction - HTML report UX improvements - Performance optimizations @@ -83,6 +84,25 @@ Such changes often require design-level discussion and may be staged across vers --- +## Security & Safety Expectations + +- Assume **untrusted input** (paths and source code). +- Add **negative tests** for any normalization or CFG change. +- Changes must preserve determinism and avoid new false positives. + +--- + +## Baseline & CI + +- Baselines are **versioned**. Regenerate with `codeclone . --update-baseline` + when detection logic or CodeClone version changes. +- Baselines in 1.3+ are tamper-evident (`generator`, `payload_sha256`). +- Baseline verification must use the same Python `major.minor` version. +- In `--fail-on-new` / `--ci`, untrusted baseline states fail fast. Outside gating + mode, baseline is ignored with warning and comparison proceeds against an empty baseline. + +--- + ## Development Setup ```bash @@ -96,15 +116,15 @@ pip install -e .[dev] Run tests: ```bash -pytest +uv run pytest ``` Static checks: ```bash -mypy -ruff check . -ruff format . +uv run mypy . +uv run ruff check . +uv run ruff format . ``` --- @@ -128,6 +148,9 @@ CodeClone follows **semantic versioning**: - **MINOR**: new detection capabilities (for example, CFG improvements) - **PATCH**: bug fixes, performance improvements, and UI/UX polish +Baselines are versioned. Any change to detection behavior must include documentation +and tests, and may require baseline regeneration. 
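+
+A minimal end-to-end sketch of that flow (the flags are the documented CLI options):
+
+```bash
+# Re-run detection and regenerate the versioned baseline
+codeclone . --update-baseline
+
+# Verify the CI gate passes against the fresh baseline
+codeclone . --ci
+```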
+ --- ## License diff --git a/README.md b/README.md index 21b7cc9..7dea74c 100644 --- a/README.md +++ b/README.md @@ -1,10 +1,12 @@ # CodeClone -[![PyPI](https://img.shields.io/pypi/v/codeclone.svg)](https://pypi.org/project/codeclone/) -[![Downloads](https://img.shields.io/pypi/dm/codeclone.svg)](https://pypi.org/project/codeclone/) -[![tests](https://github.com/orenlab/codeclone/actions/workflows/tests.yml/badge.svg?branch=main)](https://github.com/orenlab/codeclone/actions/workflows/tests.yml) -[![Python](https://img.shields.io/pypi/pyversions/codeclone.svg)](https://pypi.org/project/codeclone/) -[![License](https://img.shields.io/pypi/l/codeclone.svg)](LICENSE) +[![PyPI](https://img.shields.io/pypi/v/codeclone.svg?style=flat-square)](https://pypi.org/project/codeclone/) +[![Downloads](https://img.shields.io/pypi/dm/codeclone.svg?style=flat-square)](https://pypi.org/project/codeclone/) +[![tests](https://github.com/orenlab/codeclone/actions/workflows/tests.yml/badge.svg?branch=main&style=flat-square)](https://github.com/orenlab/codeclone/actions/workflows/tests.yml) +[![Python](https://img.shields.io/pypi/pyversions/codeclone.svg?style=flat-square)](https://pypi.org/project/codeclone/) +![CI First](https://img.shields.io/badge/CI-first-green?style=flat-square) +![Baseline](https://img.shields.io/badge/baseline-versioned-green?style=flat-square) +[![License](https://img.shields.io/pypi/l/codeclone.svg?style=flat-square)](LICENSE) **CodeClone** is a Python code clone detector based on **normalized Python AST and Control Flow Graphs (CFG)**. It helps teams discover architectural duplication and prevent new copy-paste from entering the codebase via CI. @@ -63,6 +65,12 @@ Typical use cases: - no `__init__` noise, - size and statement-count thresholds. +### Segment-level internal clone detection + +- Detects repeated **segment windows** inside the same function. +- Uses a two-step deterministic match (candidate signature → strict hash). +- Included in reports for explainability, **not** in baseline/CI failure logic. + ### Control-Flow Awareness (CFG v1) - Each function is converted into a **Control Flow Graph**. @@ -74,7 +82,11 @@ Typical use cases: - `with` / `async with` - `match` / `case` (Python 3.10+) - Current CFG semantics (v1): - - `break` and `continue` are treated as statements (no jump targets), + - `and` / `or` are modeled as short-circuit micro-CFG branches, + - `try/except` links only from statements that may raise, + - `break` / `continue` are modeled as terminating loop transitions with explicit targets, + - `for/while ... else` semantics are preserved structurally, + - `match case` and `except` handler order is preserved structurally, - after-blocks are explicit and always present, - focus is on **structural similarity**, not precise runtime semantics. @@ -86,6 +98,7 @@ This design keeps clone detection **stable, deterministic, and low-noise**. - Conservative defaults tuned for real-world Python projects. - Explicit thresholds for size and statement count. - No probabilistic scoring or heuristic similarity thresholds. +- Safe commutative normalization and local logical equivalences only. - Focus on *architectural duplication*, not micro-similarities. ### CI-friendly baseline mode @@ -102,9 +115,7 @@ This design keeps clone detection **stable, deterministic, and low-noise**. pip install codeclone ``` -Python **3.10+** is required. - ---- +Python 3.10+ is required. ## Quick Start @@ -135,11 +146,41 @@ Generate an HTML report: codeclone . 
--html .cache/codeclone/report.html ``` +Check version: + +```bash +codeclone --version +``` + +--- + +## Reports and Metadata + +All report formats include provenance metadata for auditability: + +`codeclone_version`, `python_version`, `baseline_path`, `baseline_version`, +`baseline_schema_version`, `baseline_python_version`, `baseline_loaded`, +`baseline_status` (and cache metadata when available). + +baseline_status values: + +- `ok` +- `missing` +- `legacy` +- `invalid` +- `mismatch_version` +- `mismatch_schema` +- `mismatch_python` +- `generator_mismatch` +- `integrity_missing` +- `integrity_failed` +- `too_large` + --- ## Baseline Workflow (Recommended) -### 1. Create a baseline +1. Create a baseline Run once on your current codebase: @@ -149,21 +190,73 @@ codeclone . --update-baseline Commit the generated baseline file to the repository. -### 2. Use in CI +Baselines are versioned. If CodeClone is upgraded, regenerate the baseline to keep +CI deterministic and explainable. + +Baseline format in 1.3+ is tamper-evident (generator, payload_sha256) and validated +before baseline comparison. + +2. Trusted vs untrusted baseline behavior + +Baseline states considered untrusted: + +- `invalid` +- `too_large` +- `generator_mismatch` +- `integrity_missing` +- `integrity_failed` + +Behavior: + +- in normal mode, untrusted baseline is ignored with a warning (comparison falls back to empty baseline); +- in `--fail-on-new` / `--ci`, untrusted baseline fails fast (exit code 2). + +3. Use in CI + +```bash +codeclone . --ci +``` + +or: ```bash -codeclone . --fail-on-new --no-progress +codeclone . --ci --html .cache/codeclone/report.html ``` +`--ci` is equivalent to `--fail-on-new --no-color --quiet`. + Behavior: - existing clones are allowed, -- the build fails if *new* clones appear, +- the build fails if new clones appear, - refactoring that removes duplication is always allowed. -`--fail-on-new` exits with a non-zero code when new clones are detected. +`--fail-on-new` / `--ci` exits with a non-zero code when new clones are detected. + +--- + +### Cache + +By default, CodeClone stores the cache per project at: + +```bash +/.cache/codeclone/cache.json +``` + +You can override this path with `--cache-path` (`--cache-dir` is a legacy alias). -### Python Version Consistency for Baseline Checks +If you used an older version of CodeClone, delete the legacy cache file at +`~/.cache/codeclone/cache.json` and add `.cache/` to `.gitignore`. + +Cache integrity checks are strict: signature mismatch or oversized cache files are ignored +with an explicit warning, then rebuilt from source. + +Cache entries are validated against expected structure/types; invalid entries are ignored +deterministically. + +--- + +## Python Version Consistency for Baseline Checks Due to inherent differences in Python’s AST between interpreter versions, baseline generation and verification must be performed using the same Python version. @@ -184,8 +277,9 @@ repos: - id: codeclone name: CodeClone entry: codeclone - language: python - args: [ ".", "--fail-on-new" ] + language: system + pass_filenames: false + args: [ ".", "--ci" ] types: [ python ] ``` @@ -193,30 +287,29 @@ repos: ## What CodeClone Is (and Is Not) -### CodeClone **is** +### CodeClone Is - an architectural analysis tool, - a duplication radar, - a CI guard against copy-paste, - a control-flow-aware clone detector. -### CodeClone **is not** +### CodeClone Is Not - a linter, - a formatter, - a semantic equivalence prover, - a runtime analyzer. 
---- - ## How It Works (High Level) 1. Parse Python source into AST. 2. Normalize AST (names, constants, attributes, annotations). -3. Build a **Control Flow Graph (CFG)** per function. +3. Build a Control Flow Graph (CFG) per function. 4. Compute stable CFG fingerprints. -5. Detect function-level and block-level clones. -6. Apply conservative filters to suppress noise. +5. Extract segment windows for internal clone discovery. +6. Detect function-level, block-level, and segment-level clones. +7. Apply conservative filters to suppress noise. See the architectural overview: @@ -226,10 +319,10 @@ See the architectural overview: ## Control Flow Graph (CFG) -Starting from **version 1.1.0**, CodeClone uses a **Control Flow Graph (CFG)** +Starting from version 1.1.0, CodeClone uses a Control Flow Graph (CFG) to improve structural clone detection robustness. -The CFG is a **structural abstraction**, not a runtime execution model. +The CFG is a structural abstraction, not a runtime execution model. See full design and semantics: @@ -237,6 +330,32 @@ See full design and semantics: --- +## CLI Options + +| Option | Description | Default | +|-------------------------------|----------------------------------------------------------------------|--------------------------------------| +| `root` | Project root directory to scan | `.` | +| `--version` | Print CodeClone version and exit | - | +| `--min-loc` | Minimum function LOC to analyze | `15` | +| `--min-stmt` | Minimum AST statements to analyze | `6` | +| `--processes` | Number of worker processes | `4` | +| `--cache-path FILE` | Cache file path | `/.cache/codeclone/cache.json` | +| `--cache-dir FILE` | Legacy alias for `--cache-path` | - | +| `--max-cache-size-mb MB` | Max cache size before ignore + warning | `50` | +| `--baseline FILE` | Baseline file path | `codeclone.baseline.json` | +| `--max-baseline-size-mb MB` | Max baseline size; untrusted baseline fails in CI, ignored otherwise | `5` | +| `--update-baseline` | Regenerate baseline from current results | `False` | +| `--fail-on-new` | Fail if new function/block clone groups appear vs baseline | `False` | +| `--fail-threshold MAX_CLONES` | Fail if total clone groups (`function + block`) exceed threshold | `-1` (disabled) | +| `--ci` | CI preset: `--fail-on-new --no-color --quiet` | `False` | +| `--html FILE` | Write HTML report (`.html`) | - | +| `--json FILE` | Write JSON report (`.json`) | - | +| `--text FILE` | Write text report (`.txt`) | - | +| `--no-progress` | Disable progress bar output | `False` | +| `--no-color` | Disable ANSI colors | `False` | +| `--quiet` | Minimize output (warnings/errors still shown) | `False` | +| `--verbose` | Show hash details for new clone groups in fail output | `False` | + ## License MIT License diff --git a/SECURITY.md b/SECURITY.md index 533843a..080e1ef 100644 --- a/SECURITY.md +++ b/SECURITY.md @@ -9,7 +9,8 @@ The following versions currently receive security updates: | Version | Supported | |---------|-----------| -| 1.2.x | Yes | +| 1.3.x | Yes | +| 1.2.x | No | | 1.1.x | No | | 1.0.x | No | @@ -33,6 +34,20 @@ Potential risk areas include: These areas are explicitly tested and hardened, but are still the primary focus of ongoing security review. +Additional safeguards: + +- HTML report content is escaped in both text and attribute contexts to prevent script injection. +- Reports are static and do not execute analyzed code. +- Scanner traversal is root-confined and prevents symlink-based path escape. 
+- Baseline files are schema/type validated with size limits and tamper-evident integrity fields + (`generator`, `payload_sha256` for v1.3+). +- Baseline integrity is tamper-evident (audit signal), not tamper-proof cryptographic signing. + An actor who can rewrite baseline content and recompute `payload_sha256` can still alter it. +- In `--fail-on-new` / `--ci`, untrusted baseline states fail fast; otherwise baseline is ignored + with explicit warning and comparison proceeds against an empty baseline. +- Cache files are HMAC-signed (constant-time comparison), size-limited, and ignored on mismatch. +- Cache secrets are stored next to the cache (`.cache_secret`) and must not be committed. + --- ## Reporting a Vulnerability diff --git a/codeclone.baseline.json b/codeclone.baseline.json index ce9a169..7dafea0 100644 --- a/codeclone.baseline.json +++ b/codeclone.baseline.json @@ -1,8 +1,10 @@ { - "functions": [ - "23353998d062bbdf37c345cbe5256b3f5686d956|0-19", - "7d573fa56fb11050f1642f18ca4bb3225e11e194|0-19" - ], + "functions": [], "blocks": [], - "python_version": "3.13" + "python_version": "3.13", + "baseline_version": "1.3.0", + "schema_version": 1, + "generator": "codeclone", + "payload_sha256": "92e80b05c857b796bb452de9e62985a1568874da468bc671998133975c94397a", + "created_at": "2026-02-08T09:54:31+00:00" } \ No newline at end of file diff --git a/codeclone/_cli_args.py b/codeclone/_cli_args.py new file mode 100644 index 0000000..49c0ad5 --- /dev/null +++ b/codeclone/_cli_args.py @@ -0,0 +1,161 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +import argparse +from typing import cast + +from . 
import ui_messages as ui + + +class _HelpFormatter(argparse.ArgumentDefaultsHelpFormatter): + def _get_help_string(self, action: argparse.Action) -> str: + if action.dest == "cache_path": + return action.help or "" + return cast(str, super()._get_help_string(action)) + + +def build_parser(version: str) -> argparse.ArgumentParser: + ap = argparse.ArgumentParser( + prog="codeclone", + description="AST and CFG-based code clone detector for Python.", + formatter_class=_HelpFormatter, + ) + ap.add_argument( + "--version", + action="version", + version=ui.version_output(version), + help=ui.HELP_VERSION, + ) + + core_group = ap.add_argument_group("Target") + core_group.add_argument( + "root", + nargs="?", + default=".", + help=ui.HELP_ROOT, + ) + + tune_group = ap.add_argument_group("Analysis Tuning") + tune_group.add_argument( + "--min-loc", + type=int, + default=15, + help=ui.HELP_MIN_LOC, + ) + tune_group.add_argument( + "--min-stmt", + type=int, + default=6, + help=ui.HELP_MIN_STMT, + ) + tune_group.add_argument( + "--processes", + type=int, + default=4, + help=ui.HELP_PROCESSES, + ) + tune_group.add_argument( + "--cache-path", + dest="cache_path", + metavar="FILE", + default=None, + help=ui.HELP_CACHE_PATH, + ) + tune_group.add_argument( + "--cache-dir", + dest="cache_path", + metavar="FILE", + default=None, + help=ui.HELP_CACHE_DIR_LEGACY, + ) + tune_group.add_argument( + "--max-cache-size-mb", + type=int, + default=50, + metavar="MB", + help=ui.HELP_MAX_CACHE_SIZE_MB, + ) + + ci_group = ap.add_argument_group("Baseline & CI/CD") + ci_group.add_argument( + "--baseline", + default="codeclone.baseline.json", + help=ui.HELP_BASELINE, + ) + ci_group.add_argument( + "--max-baseline-size-mb", + type=int, + default=5, + metavar="MB", + help=ui.HELP_MAX_BASELINE_SIZE_MB, + ) + ci_group.add_argument( + "--update-baseline", + action="store_true", + help=ui.HELP_UPDATE_BASELINE, + ) + ci_group.add_argument( + "--fail-on-new", + action="store_true", + help=ui.HELP_FAIL_ON_NEW, + ) + ci_group.add_argument( + "--fail-threshold", + type=int, + default=-1, + metavar="MAX_CLONES", + help=ui.HELP_FAIL_THRESHOLD, + ) + ci_group.add_argument( + "--ci", + action="store_true", + help=ui.HELP_CI, + ) + + out_group = ap.add_argument_group("Reporting") + out_group.add_argument( + "--html", + dest="html_out", + metavar="FILE", + help=ui.HELP_HTML, + ) + out_group.add_argument( + "--json", + dest="json_out", + metavar="FILE", + help=ui.HELP_JSON, + ) + out_group.add_argument( + "--text", + dest="text_out", + metavar="FILE", + help=ui.HELP_TEXT, + ) + out_group.add_argument( + "--no-progress", + action="store_true", + help=ui.HELP_NO_PROGRESS, + ) + out_group.add_argument( + "--no-color", + action="store_true", + help=ui.HELP_NO_COLOR, + ) + out_group.add_argument( + "--quiet", + action="store_true", + help=ui.HELP_QUIET, + ) + out_group.add_argument( + "--verbose", + action="store_true", + help=ui.HELP_VERBOSE, + ) + return ap diff --git a/codeclone/_cli_meta.py b/codeclone/_cli_meta.py new file mode 100644 index 0000000..fe6a04e --- /dev/null +++ b/codeclone/_cli_meta.py @@ -0,0 +1,43 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. 
+""" + +from __future__ import annotations + +import sys +from pathlib import Path +from typing import Any + +from .baseline import Baseline + + +def _current_python_version() -> str: + return f"{sys.version_info.major}.{sys.version_info.minor}" + + +def _build_report_meta( + *, + codeclone_version: str, + baseline_path: Path, + baseline: Baseline, + baseline_loaded: bool, + baseline_status: str, + cache_path: Path, + cache_used: bool, +) -> dict[str, Any]: + return { + "codeclone_version": codeclone_version, + "python_version": _current_python_version(), + "baseline_path": str(baseline_path), + "baseline_version": baseline.baseline_version, + "baseline_schema_version": baseline.schema_version, + "baseline_python_version": baseline.python_version, + "baseline_loaded": baseline_loaded, + "baseline_status": baseline_status, + "cache_path": str(cache_path), + "cache_used": cache_used, + } diff --git a/codeclone/_cli_paths.py b/codeclone/_cli_paths.py new file mode 100644 index 0000000..4dcd72f --- /dev/null +++ b/codeclone/_cli_paths.py @@ -0,0 +1,36 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +import sys +from collections.abc import Callable +from pathlib import Path + +from rich.console import Console + + +def expand_path(p: str) -> Path: + return Path(p).expanduser().resolve() + + +def _validate_output_path( + path: str, + *, + expected_suffix: str, + label: str, + console: Console, + invalid_message: Callable[..., str], +) -> Path: + out = Path(path).expanduser() + if out.suffix.lower() != expected_suffix: + console.print( + invalid_message(label=label, path=out, expected_suffix=expected_suffix) + ) + sys.exit(2) + return out.resolve() diff --git a/codeclone/_cli_summary.py b/codeclone/_cli_summary.py new file mode 100644 index 0000000..40df388 --- /dev/null +++ b/codeclone/_cli_summary.py @@ -0,0 +1,115 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +from rich.console import Console +from rich.table import Table +from rich.text import Text + +from . 
import ui_messages as ui + + +def _summary_value_style(*, label: str, value: int) -> str: + if value == 0: + return "dim" + if label == ui.SUMMARY_LABEL_NEW_BASELINE: + return "bold red" + if label == ui.SUMMARY_LABEL_SUPPRESSED: + return "yellow" + return "bold green" + + +def _build_summary_rows( + *, + files_found: int, + files_analyzed: int, + cache_hits: int, + files_skipped: int, + func_clones_count: int, + block_clones_count: int, + segment_clones_count: int, + suppressed_segment_groups: int, + new_clones_count: int, +) -> list[tuple[str, int]]: + return [ + (ui.SUMMARY_LABEL_FILES_FOUND, files_found), + (ui.SUMMARY_LABEL_FILES_ANALYZED, files_analyzed), + (ui.SUMMARY_LABEL_CACHE_HITS, cache_hits), + (ui.SUMMARY_LABEL_FILES_SKIPPED, files_skipped), + (ui.SUMMARY_LABEL_FUNCTION, func_clones_count), + (ui.SUMMARY_LABEL_BLOCK, block_clones_count), + (ui.SUMMARY_LABEL_SEGMENT, segment_clones_count), + (ui.SUMMARY_LABEL_SUPPRESSED, suppressed_segment_groups), + (ui.SUMMARY_LABEL_NEW_BASELINE, new_clones_count), + ] + + +def _build_summary_table(rows: list[tuple[str, int]]) -> Table: + summary_table = Table(title=ui.SUMMARY_TITLE, show_header=True) + summary_table.add_column("Metric") + summary_table.add_column("Value", justify="right") + for label, value in rows: + summary_table.add_row( + label, + Text(str(value), style=_summary_value_style(label=label, value=value)), + ) + return summary_table + + +def _print_summary( + *, + console: Console, + quiet: bool, + files_found: int, + files_analyzed: int, + cache_hits: int, + files_skipped: int, + func_clones_count: int, + block_clones_count: int, + segment_clones_count: int, + suppressed_segment_groups: int, + new_clones_count: int, +) -> None: + invariant_ok = files_found == (files_analyzed + cache_hits + files_skipped) + rows = _build_summary_rows( + files_found=files_found, + files_analyzed=files_analyzed, + cache_hits=cache_hits, + files_skipped=files_skipped, + func_clones_count=func_clones_count, + block_clones_count=block_clones_count, + segment_clones_count=segment_clones_count, + suppressed_segment_groups=suppressed_segment_groups, + new_clones_count=new_clones_count, + ) + + if quiet: + console.print(ui.SUMMARY_TITLE) + console.print( + ui.fmt_summary_compact_input( + found=files_found, + analyzed=files_analyzed, + cache_hits=cache_hits, + skipped=files_skipped, + ) + ) + console.print( + ui.fmt_summary_compact_clones( + function=func_clones_count, + block=block_clones_count, + segment=segment_clones_count, + suppressed=suppressed_segment_groups, + new=new_clones_count, + ) + ) + else: + console.print(_build_summary_table(rows)) + + if not invariant_ok: + console.print(f"[warning]{ui.WARN_SUMMARY_ACCOUNTING_MISMATCH}[/warning]") diff --git a/codeclone/_html_escape.py b/codeclone/_html_escape.py new file mode 100644 index 0000000..16f7ae4 --- /dev/null +++ b/codeclone/_html_escape.py @@ -0,0 +1,35 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +import html +from typing import Any + + +def _escape_html(v: Any) -> str: + text = html.escape("" if v is None else str(v), quote=True) + text = text.replace("`", "`") + text = text.replace("\u2028", "
").replace("\u2029", "
") + return text + + +def _escape_attr(v: Any) -> str: + text = html.escape("" if v is None else str(v), quote=True) + text = text.replace("`", "`") + text = text.replace("\u2028", "
").replace("\u2029", "
") + return text + + +def _meta_display(v: Any) -> str: + if isinstance(v, bool): + return "true" if v else "false" + if v is None: + return "n/a" + text = str(v).strip() + return text if text else "n/a" diff --git a/codeclone/_html_snippets.py b/codeclone/_html_snippets.py new file mode 100644 index 0000000..915cb1d --- /dev/null +++ b/codeclone/_html_snippets.py @@ -0,0 +1,208 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +import html +import importlib +import itertools +from collections.abc import Iterable +from dataclasses import dataclass +from functools import lru_cache +from typing import Any, NamedTuple, cast + +from .errors import FileProcessingError + + +def pairwise(iterable: Iterable[Any]) -> Iterable[tuple[Any, Any]]: + a, b = itertools.tee(iterable) + next(b, None) + return zip(a, b, strict=False) + + +@dataclass(slots=True) +class _Snippet: + filepath: str + start_line: int + end_line: int + code_html: str + + +class _FileCache: + __slots__ = ("_get_lines_impl", "maxsize") + + def __init__(self, maxsize: int = 128) -> None: + self.maxsize = maxsize + self._get_lines_impl = lru_cache(maxsize=maxsize)(self._read_file_range) + + @staticmethod + def _read_file_range( + filepath: str, start_line: int, end_line: int + ) -> tuple[str, ...]: + if start_line < 1: + start_line = 1 + if end_line < start_line: + return () + + try: + + def _read_with_errors(errors: str) -> tuple[str, ...]: + lines: list[str] = [] + with open(filepath, encoding="utf-8", errors=errors) as f: + for lineno, line in enumerate(f, start=1): + if lineno < start_line: + continue + if lineno > end_line: + break + lines.append(line.rstrip("\n")) + return tuple(lines) + + try: + return _read_with_errors("strict") + except UnicodeDecodeError: + return _read_with_errors("replace") + except OSError as e: + raise FileProcessingError(f"Cannot read {filepath}: {e}") from e + + def get_lines_range( + self, filepath: str, start_line: int, end_line: int + ) -> tuple[str, ...]: + return self._get_lines_impl(filepath, start_line, end_line) + + class _CacheInfo(NamedTuple): + hits: int + misses: int + maxsize: int | None + currsize: int + + def cache_info(self) -> _CacheInfo: + return cast(_FileCache._CacheInfo, self._get_lines_impl.cache_info()) + + +def _try_pygments(code: str) -> str | None: + try: + pygments = importlib.import_module("pygments") + formatters = importlib.import_module("pygments.formatters") + lexers = importlib.import_module("pygments.lexers") + except ImportError: + return None + + highlight = pygments.highlight + formatter_cls = formatters.HtmlFormatter + lexer_cls = lexers.PythonLexer + result = highlight(code, lexer_cls(), formatter_cls(nowrap=True)) + return result if isinstance(result, str) else None + + +def _pygments_css(style_name: str) -> str: + """ + Returns CSS for pygments tokens. Scoped to `.codebox` to avoid leaking styles. + If Pygments is not available or style missing, returns "". 
+ """ + try: + formatters = importlib.import_module("pygments.formatters") + except ImportError: + return "" + + try: + formatter_cls = formatters.HtmlFormatter + fmt = formatter_cls(style=style_name) + except Exception: + try: + fmt = formatter_cls() + except Exception: + return "" + + try: + css = fmt.get_style_defs(".codebox") + return css if isinstance(css, str) else "" + except Exception: + return "" + + +def _prefix_css(css: str, prefix: str) -> str: + """ + Prefix every selector block with `prefix `. + Safe enough for pygments CSS which is mostly selector blocks and comments. + """ + out_lines: list[str] = [] + for line in css.splitlines(): + stripped = line.strip() + if not stripped: + out_lines.append(line) + continue + if stripped.startswith(("/*", "*", "*/")): + out_lines.append(line) + continue + if "{" in line: + before, after = line.split("{", 1) + sel = before.strip() + if sel: + out_lines.append(f"{prefix} {sel} {{ {after}".rstrip()) + else: + out_lines.append(line) + else: + out_lines.append(line) + return "\n".join(out_lines) + + +def _render_code_block( + *, + filepath: str, + start_line: int, + end_line: int, + file_cache: _FileCache, + context: int, + max_lines: int, +) -> _Snippet: + s = max(1, start_line - context) + e = end_line + context + + if e - s + 1 > max_lines: + e = s + max_lines - 1 + + try: + lines = file_cache.get_lines_range(filepath, s, e) + except FileProcessingError: + missing = ( + '
<pre class="codebox">' +            '<span class="line">Source file unavailable</span>' +            "</pre>
" + ) + return _Snippet( + filepath=filepath, + start_line=start_line, + end_line=end_line, + code_html=missing, + ) + + numbered: list[tuple[bool, str]] = [] + for lineno, line in enumerate(lines, start=s): + hit = start_line <= lineno <= end_line + numbered.append((hit, f"{lineno:>5} | {line.rstrip()}")) + + raw = "\n".join(text for _, text in numbered) + highlighted = _try_pygments(raw) + + if highlighted is None: + rendered: list[str] = [] + for hit, text in numbered: + cls = "hitline" if hit else "line" + rendered.append( + f'
<span class="{cls}">{html.escape(text, quote=False)}</span>
' + ) + body = "\n".join(rendered) + else: + body = highlighted + + return _Snippet( + filepath=filepath, + start_line=start_line, + end_line=end_line, + code_html=f'
<pre class="codebox">{body}</pre>
', + ) diff --git a/codeclone/_report_grouping.py b/codeclone/_report_grouping.py new file mode 100644 index 0000000..3ad44ab --- /dev/null +++ b/codeclone/_report_grouping.py @@ -0,0 +1,64 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +from ._report_types import GroupItem, GroupMap + + +def build_groups(units: list[GroupItem]) -> GroupMap: + groups: GroupMap = {} + for u in units: + key = f"{u['fingerprint']}|{u['loc_bucket']}" + groups.setdefault(key, []).append(u) + return {k: v for k, v in groups.items() if len(v) > 1} + + +def build_block_groups(blocks: list[GroupItem], min_functions: int = 2) -> GroupMap: + groups: GroupMap = {} + for b in blocks: + groups.setdefault(b["block_hash"], []).append(b) + + filtered: GroupMap = {} + for h, items in groups.items(): + functions = {i["qualname"] for i in items} + if len(functions) >= min_functions: + filtered[h] = items + + return filtered + + +def build_segment_groups( + segments: list[GroupItem], min_occurrences: int = 2 +) -> GroupMap: + sig_groups: GroupMap = {} + for s in segments: + sig_groups.setdefault(s["segment_sig"], []).append(s) + + confirmed: GroupMap = {} + for items in sig_groups.values(): + if len(items) < min_occurrences: + continue + + hash_groups: GroupMap = {} + for item in items: + hash_groups.setdefault(item["segment_hash"], []).append(item) + + for segment_hash, hash_items in hash_groups.items(): + if len(hash_items) < min_occurrences: + continue + + by_func: GroupMap = {} + for it in hash_items: + by_func.setdefault(it["qualname"], []).append(it) + + for qualname, q_items in by_func.items(): + if len(q_items) >= min_occurrences: + confirmed[f"{segment_hash}|{qualname}"] = q_items + + return confirmed diff --git a/codeclone/_report_segments.py b/codeclone/_report_segments.py new file mode 100644 index 0000000..bd985cb --- /dev/null +++ b/codeclone/_report_segments.py @@ -0,0 +1,247 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. 
+""" + +from __future__ import annotations + +import ast +from dataclasses import dataclass +from pathlib import Path + +from ._report_types import GroupItem, GroupMap + +SEGMENT_MIN_UNIQUE_STMT_TYPES = 2 + +_CONTROL_FLOW_STMTS = ( + ast.If, + ast.For, + ast.While, + ast.Try, + ast.With, + ast.Match, + ast.AsyncFor, + ast.AsyncWith, +) +_FORBIDDEN_STMTS = (ast.Return, ast.Raise, ast.Assert) + + +@dataclass(frozen=True, slots=True) +class _SegmentAnalysis: + unique_stmt_types: int + has_control_flow: bool + is_boilerplate: bool + + +class _QualnameCollector(ast.NodeVisitor): + __slots__ = ("funcs", "stack") + + def __init__(self) -> None: + self.stack: list[str] = [] + self.funcs: dict[str, ast.FunctionDef | ast.AsyncFunctionDef] = {} + + def visit_ClassDef(self, node: ast.ClassDef) -> None: + self.stack.append(node.name) + self.generic_visit(node) + self.stack.pop() + + def visit_FunctionDef(self, node: ast.FunctionDef) -> None: + name = ".".join([*self.stack, node.name]) if self.stack else node.name + self.funcs[name] = node + + def visit_AsyncFunctionDef(self, node: ast.AsyncFunctionDef) -> None: + name = ".".join([*self.stack, node.name]) if self.stack else node.name + self.funcs[name] = node + + +def _merge_segment_items(items: list[GroupItem]) -> list[GroupItem]: + if not items: + return [] + + items_sorted = sorted( + items, + key=lambda i: ( + i.get("filepath", ""), + i.get("qualname", ""), + int(i.get("start_line", 0)), + int(i.get("end_line", 0)), + ), + ) + + merged: list[GroupItem] = [] + current: GroupItem | None = None + + for item in items_sorted: + start = int(item.get("start_line", 0)) + end = int(item.get("end_line", 0)) + if start <= 0 or end <= 0: + continue + + if current is None: + current = dict(item) + current["start_line"] = start + current["end_line"] = end + current["size"] = max(1, end - start + 1) + continue + + same_owner = current.get("filepath") == item.get("filepath") and current.get( + "qualname" + ) == item.get("qualname") + if same_owner and start <= int(current["end_line"]) + 1: + current["end_line"] = max(int(current["end_line"]), end) + current["size"] = max( + 1, int(current["end_line"]) - int(current["start_line"]) + 1 + ) + continue + + merged.append(current) + current = dict(item) + current["start_line"] = start + current["end_line"] = end + current["size"] = max(1, end - start + 1) + + if current is not None: + merged.append(current) + + return merged + + +def _collect_file_functions( + filepath: str, +) -> dict[str, ast.FunctionDef | ast.AsyncFunctionDef] | None: + try: + source = Path(filepath).read_text("utf-8") + except OSError: + return None + try: + tree = ast.parse(source) + except SyntaxError: + return None + + collector = _QualnameCollector() + collector.visit(tree) + return collector.funcs + + +def _segment_statements( + func_node: ast.FunctionDef | ast.AsyncFunctionDef, start_line: int, end_line: int +) -> list[ast.stmt]: + body = getattr(func_node, "body", None) + if not isinstance(body, list): + return [] + stmts: list[ast.stmt] = [] + for stmt in body: + lineno = getattr(stmt, "lineno", None) + end = getattr(stmt, "end_lineno", None) + if lineno is None or end is None: + continue + if lineno >= start_line and end <= end_line: + stmts.append(stmt) + return stmts + + +def _assign_targets_attribute_only(stmt: ast.stmt) -> bool: + if isinstance(stmt, ast.Assign): + return all(isinstance(t, ast.Attribute) for t in stmt.targets) + if isinstance(stmt, ast.AnnAssign): + return isinstance(stmt.target, ast.Attribute) + return False + + +def 
_analyze_segment_statements(stmts: list[ast.stmt]) -> _SegmentAnalysis | None: + if not stmts: + return None + + unique_types = {type(s) for s in stmts} + has_control_flow = any(isinstance(s, _CONTROL_FLOW_STMTS) for s in stmts) + has_forbidden = any(isinstance(s, _FORBIDDEN_STMTS) for s in stmts) + has_call_stmt = any( + isinstance(s, ast.Expr) and isinstance(s.value, ast.Call) for s in stmts + ) + + assign_stmts = [s for s in stmts if isinstance(s, (ast.Assign, ast.AnnAssign))] + assign_ratio = len(assign_stmts) / len(stmts) + assign_attr_only = all(_assign_targets_attribute_only(s) for s in assign_stmts) + + is_boilerplate = ( + assign_ratio >= 0.8 + and assign_attr_only + and not has_control_flow + and not has_forbidden + and not has_call_stmt + ) + + return _SegmentAnalysis( + unique_stmt_types=len(unique_types), + has_control_flow=has_control_flow, + is_boilerplate=is_boilerplate, + ) + + +def prepare_segment_report_groups( + segment_groups: GroupMap, +) -> tuple[GroupMap, int]: + """ + Merge overlapping segment windows and suppress low-value boilerplate groups + for reporting. Detection hashes remain unchanged. + """ + suppressed = 0 + filtered: GroupMap = {} + file_cache: dict[str, dict[str, ast.FunctionDef | ast.AsyncFunctionDef] | None] = {} + + for key, items in segment_groups.items(): + merged_items = _merge_segment_items(items) + if not merged_items: + continue + + analyses: list[_SegmentAnalysis] = [] + unknown = False + for item in merged_items: + filepath = str(item.get("filepath", "")) + qualname = str(item.get("qualname", "")) + start_line = int(item.get("start_line", 0)) + end_line = int(item.get("end_line", 0)) + if not filepath or not qualname or start_line <= 0 or end_line <= 0: + unknown = True + break + + if filepath not in file_cache: + file_cache[filepath] = _collect_file_functions(filepath) + funcs = file_cache[filepath] + if not funcs: + unknown = True + break + + local_name = qualname.split(":", 1)[1] if ":" in qualname else qualname + func_node = funcs.get(local_name) + if func_node is None: + unknown = True + break + + stmts = _segment_statements(func_node, start_line, end_line) + analysis = _analyze_segment_statements(stmts) + if analysis is None: + unknown = True + break + analyses.append(analysis) + + if unknown: + filtered[key] = merged_items + continue + + all_boilerplate = all(a.is_boilerplate for a in analyses) + all_too_simple = all( + (not a.has_control_flow) + and (a.unique_stmt_types < SEGMENT_MIN_UNIQUE_STMT_TYPES) + for a in analyses + ) + if all_boilerplate or all_too_simple: + suppressed += 1 + continue + + filtered[key] = merged_items + + return filtered, suppressed diff --git a/codeclone/_report_serialize.py b/codeclone/_report_serialize.py new file mode 100644 index 0000000..54dcef5 --- /dev/null +++ b/codeclone/_report_serialize.py @@ -0,0 +1,160 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. 
+""" + +from __future__ import annotations + +import json +from collections.abc import Mapping +from typing import Any + +from ._report_types import GroupItem, GroupMap + + +def to_json(groups: GroupMap) -> str: + def _sorted_items(items: list[GroupItem]) -> list[GroupItem]: + return sorted( + items, + key=lambda item: ( + str(item.get("filepath", "")), + int(item.get("start_line", 0)), + int(item.get("end_line", 0)), + str(item.get("qualname", "")), + ), + ) + + return json.dumps( + { + "group_count": len(groups), + "groups": [ + {"key": k, "count": len(v), "items": _sorted_items(v)} + for k, v in sorted( + groups.items(), + key=lambda kv: (-len(kv[1]), kv[0]), + ) + ], + }, + ensure_ascii=False, + indent=2, + ) + + +def to_json_report( + func_groups: GroupMap, + block_groups: GroupMap, + segment_groups: GroupMap, + meta: Mapping[str, Any] | None = None, +) -> str: + def _sorted_items(items: list[GroupItem]) -> list[GroupItem]: + return sorted( + items, + key=lambda item: ( + str(item.get("filepath", "")), + int(item.get("start_line", 0)), + int(item.get("end_line", 0)), + str(item.get("qualname", "")), + ), + ) + + def _sorted_group_map(groups: GroupMap) -> GroupMap: + return { + k: _sorted_items(v) + for k, v in sorted(groups.items(), key=lambda kv: (-len(kv[1]), kv[0])) + } + + meta_payload = dict(meta or {}) + func_sorted = _sorted_group_map(func_groups) + block_sorted = _sorted_group_map(block_groups) + segment_sorted = _sorted_group_map(segment_groups) + return json.dumps( + { + "meta": meta_payload, + "function_clones": func_sorted, + "block_clones": block_sorted, + "segment_clones": segment_sorted, + # Backward-compatible keys. + "functions": func_sorted, + "blocks": block_sorted, + "segments": segment_sorted, + }, + ensure_ascii=False, + indent=2, + ) + + +def to_text(groups: GroupMap) -> str: + lines: list[str] = [] + for i, (_, v) in enumerate( + sorted(groups.items(), key=lambda kv: (-len(kv[1]), kv[0])) + ): + items = sorted( + v, + key=lambda item: ( + str(item.get("filepath", "")), + int(item.get("start_line", 0)), + int(item.get("end_line", 0)), + str(item.get("qualname", "")), + ), + ) + lines.append(f"\n=== Clone group #{i + 1} (count={len(v)}) ===") + lines.extend( + [ + f"- {item['qualname']} " + f"{item['filepath']}:{item['start_line']}-{item['end_line']} " + f"loc={item.get('loc', item.get('size'))}" + for item in items + ] + ) + return "\n".join(lines).strip() + "\n" + + +def _format_meta_text_value(value: Any) -> str: + if isinstance(value, bool): + return "true" if value else "false" + if value is None: + return "n/a" + text = str(value).strip() + return text if text else "n/a" + + +def to_text_report( + *, + meta: Mapping[str, Any], + func_groups: GroupMap, + block_groups: GroupMap, + segment_groups: GroupMap, +) -> str: + lines = [ + "REPORT METADATA", + f"CodeClone version: {_format_meta_text_value(meta.get('codeclone_version'))}", + f"Python version: {_format_meta_text_value(meta.get('python_version'))}", + f"Baseline path: {_format_meta_text_value(meta.get('baseline_path'))}", + f"Baseline version: {_format_meta_text_value(meta.get('baseline_version'))}", + "Baseline schema version: " + f"{_format_meta_text_value(meta.get('baseline_schema_version'))}", + "Baseline Python version: " + f"{_format_meta_text_value(meta.get('baseline_python_version'))}", + f"Baseline loaded: {_format_meta_text_value(meta.get('baseline_loaded'))}", + f"Baseline status: {_format_meta_text_value(meta.get('baseline_status'))}", + ] + if "cache_path" in meta: + lines.append(f"Cache 
path: {_format_meta_text_value(meta.get('cache_path'))}") + if "cache_used" in meta: + lines.append(f"Cache used: {_format_meta_text_value(meta.get('cache_used'))}") + + sections = [ + ("FUNCTION CLONES", func_groups), + ("BLOCK CLONES", block_groups), + ("SEGMENT CLONES", segment_groups), + ] + for title, groups in sections: + lines.append("") + lines.append(title) + block = to_text(groups).rstrip() + lines.append(block if block else "(none)") + + return "\n".join(lines).rstrip() + "\n" diff --git a/codeclone/_report_types.py b/codeclone/_report_types.py new file mode 100644 index 0000000..6fbe632 --- /dev/null +++ b/codeclone/_report_types.py @@ -0,0 +1,14 @@ +""" +CodeClone — AST and CFG-based code clone detector for Python +focused on architectural duplication. + +Copyright (c) 2026 Den Rozhnovskiy +Licensed under the MIT License. +""" + +from __future__ import annotations + +from typing import Any + +GroupItem = dict[str, Any] +GroupMap = dict[str, list[GroupItem]] diff --git a/codeclone/baseline.py b/codeclone/baseline.py index 74f2030..4e0894f 100644 --- a/codeclone/baseline.py +++ b/codeclone/baseline.py @@ -8,58 +8,155 @@ from __future__ import annotations +import hashlib +import hmac import json from collections.abc import Mapping +from datetime import datetime, timezone from pathlib import Path from typing import Any +from . import __version__ +from .errors import BaselineValidationError + +BASELINE_SCHEMA_VERSION = 1 +MAX_BASELINE_SIZE_BYTES = 5 * 1024 * 1024 +BASELINE_GENERATOR = "codeclone" + class Baseline: - __slots__ = ("blocks", "functions", "path", "python_version") + __slots__ = ( + "baseline_version", + "blocks", + "created_at", + "functions", + "generator", + "path", + "payload_sha256", + "python_version", + "schema_version", + ) def __init__(self, path: str | Path): self.path = Path(path) self.functions: set[str] = set() self.blocks: set[str] = set() self.python_version: str | None = None + self.baseline_version: str | None = None + self.schema_version: int | None = None + self.generator: str | None = None + self.payload_sha256: str | None = None + self.created_at: str | None = None - def load(self) -> None: + def load(self, *, max_size_bytes: int | None = None) -> None: if not self.path.exists(): return + size_limit = ( + MAX_BASELINE_SIZE_BYTES if max_size_bytes is None else max_size_bytes + ) try: - data = json.loads(self.path.read_text("utf-8")) - self.functions = set(data.get("functions", [])) - self.blocks = set(data.get("blocks", [])) - python_version = data.get("python_version") - self.python_version = ( - python_version if isinstance(python_version, str) else None + size = self.path.stat().st_size + except OSError as e: + raise BaselineValidationError( + f"Cannot stat baseline file at {self.path}: {e}" + ) from e + if size > size_limit: + raise BaselineValidationError( + "Baseline file is too large " + f"({size} bytes, max {size_limit} bytes) at {self.path}", + status="too_large", ) + + try: + data = json.loads(self.path.read_text("utf-8")) except json.JSONDecodeError as e: - raise ValueError(f"Corrupted baseline file at {self.path}: {e}") from e + raise BaselineValidationError( + f"Corrupted baseline file at {self.path}: {e}" + ) from e + + if not isinstance(data, dict): + raise BaselineValidationError( + f"Baseline payload must be an object at {self.path}" + ) + + functions = _require_str_list(data, "functions", path=self.path) + blocks = _require_str_list(data, "blocks", path=self.path) + python_version = _optional_str(data, "python_version", 
path=self.path) + baseline_version = _optional_str(data, "baseline_version", path=self.path) + schema_version = _optional_int(data, "schema_version", path=self.path) + generator = _optional_str_loose(data, "generator") + payload_sha256 = _optional_str_loose(data, "payload_sha256") + created_at = _optional_str(data, "created_at", path=self.path) + + self.functions = set(functions) + self.blocks = set(blocks) + self.python_version = python_version + self.baseline_version = baseline_version + self.schema_version = schema_version + self.generator = generator + self.payload_sha256 = payload_sha256 + self.created_at = created_at def save(self) -> None: self.path.parent.mkdir(parents=True, exist_ok=True) + now_utc = datetime.now(timezone.utc).replace(microsecond=0).isoformat() self.path.write_text( json.dumps( - _baseline_payload(self.functions, self.blocks, self.python_version), + _baseline_payload( + self.functions, + self.blocks, + self.python_version, + self.baseline_version, + self.schema_version, + self.generator, + now_utc, + ), indent=2, ensure_ascii=False, ), "utf-8", ) + def is_legacy_format(self) -> bool: + return self.baseline_version is None or self.schema_version is None + + def verify_integrity(self) -> None: + if self.is_legacy_format(): + return + if self.generator != BASELINE_GENERATOR: + raise BaselineValidationError( + "Baseline generator mismatch: expected 'codeclone'.", + status="generator_mismatch", + ) + if not isinstance(self.payload_sha256, str): + raise BaselineValidationError( + "Baseline integrity payload hash is missing.", + status="integrity_missing", + ) + expected = _compute_payload_sha256(self.functions, self.blocks) + if not hmac.compare_digest(self.payload_sha256, expected): + raise BaselineValidationError( + "Baseline integrity check failed: payload_sha256 mismatch.", + status="integrity_failed", + ) + @staticmethod def from_groups( func_groups: Mapping[str, object], block_groups: Mapping[str, object], path: str | Path = "", python_version: str | None = None, + baseline_version: str | None = None, + schema_version: int | None = None, ) -> Baseline: bl = Baseline(path) bl.functions = set(func_groups.keys()) bl.blocks = set(block_groups.keys()) bl.python_version = python_version + bl.baseline_version = baseline_version + bl.schema_version = schema_version + bl.generator = BASELINE_GENERATOR return bl def diff( @@ -74,11 +171,75 @@ def _baseline_payload( functions: set[str], blocks: set[str], python_version: str | None, + baseline_version: str | None, + schema_version: int | None, + generator: str | None, + created_at: str | None, ) -> dict[str, Any]: - payload: dict[str, Any] = { - "functions": sorted(functions), - "blocks": sorted(blocks), - } + payload: dict[str, Any] = _canonical_payload(functions, blocks) if python_version: payload["python_version"] = python_version + payload["baseline_version"] = baseline_version or __version__ + payload["schema_version"] = ( + schema_version if schema_version is not None else BASELINE_SCHEMA_VERSION + ) + payload["generator"] = generator or BASELINE_GENERATOR + payload["payload_sha256"] = _compute_payload_sha256(functions, blocks) + if created_at: + payload["created_at"] = created_at return payload + + +def _canonical_payload(functions: set[str], blocks: set[str]) -> dict[str, list[str]]: + return { + "functions": sorted(functions), + "blocks": sorted(blocks), + } + + +def _compute_payload_sha256(functions: set[str], blocks: set[str]) -> str: + serialized = json.dumps( + _canonical_payload(functions, blocks), + 
sort_keys=True, + separators=(",", ":"), + ensure_ascii=False, + ) + return hashlib.sha256(serialized.encode("utf-8")).hexdigest() + + +def _require_str_list(data: dict[str, Any], key: str, *, path: Path) -> list[str]: + value = data.get(key) + if not isinstance(value, list) or not all(isinstance(v, str) for v in value): + raise BaselineValidationError( + f"Invalid baseline schema at {path}: '{key}' must be list[str]" + ) + return value + + +def _optional_str(data: dict[str, Any], key: str, *, path: Path) -> str | None: + value = data.get(key) + if value is None: + return None + if not isinstance(value, str): + raise BaselineValidationError( + f"Invalid baseline schema at {path}: '{key}' must be string" + ) + return value + + +def _optional_int(data: dict[str, Any], key: str, *, path: Path) -> int | None: + value = data.get(key) + if value is None: + return None + if not isinstance(value, int): + raise BaselineValidationError( + f"Invalid baseline schema at {path}: '{key}' must be integer" + ) + return value + + +def _optional_str_loose(data: dict[str, Any], key: str) -> str | None: + value = data.get(key) + if isinstance(value, str): + return value + return None diff --git a/codeclone/blocks.py b/codeclone/blocks.py index 551d243..3469361 100644 --- a/codeclone/blocks.py +++ b/codeclone/blocks.py @@ -12,6 +12,7 @@ from dataclasses import dataclass from .blockhash import stmt_hash +from .fingerprint import sha1 from .normalize import NormalizationConfig @@ -25,6 +26,17 @@ class BlockUnit: size: int +@dataclass(frozen=True, slots=True) +class SegmentUnit: + segment_hash: str + segment_sig: str + filepath: str + qualname: str + start_line: int + end_line: int + size: int + + def extract_blocks( func_node: ast.AST, *, @@ -72,3 +84,48 @@ def extract_blocks( break return blocks + + +def extract_segments( + func_node: ast.AST, + *, + filepath: str, + qualname: str, + cfg: NormalizationConfig, + window_size: int, + max_segments: int, +) -> list[SegmentUnit]: + body = getattr(func_node, "body", None) + if not isinstance(body, list) or len(body) < window_size: + return [] + + stmt_hashes = [stmt_hash(stmt, cfg) for stmt in body] + + segments: list[SegmentUnit] = [] + + for i in range(len(stmt_hashes) - window_size + 1): + start = getattr(body[i], "lineno", None) + end = getattr(body[i + window_size - 1], "end_lineno", None) + if not start or not end: + continue + + window = stmt_hashes[i : i + window_size] + segment_hash = sha1("|".join(window)) + segment_sig = sha1("|".join(sorted(window))) + + segments.append( + SegmentUnit( + segment_hash=segment_hash, + segment_sig=segment_sig, + filepath=filepath, + qualname=qualname, + start_line=start, + end_line=end, + size=window_size, + ) + ) + + if len(segments) >= max_segments: + break + + return segments diff --git a/codeclone/cache.py b/codeclone/cache.py index f652d17..566e82e 100644 --- a/codeclone/cache.py +++ b/codeclone/cache.py @@ -19,11 +19,14 @@ from typing import TYPE_CHECKING, Any, TypedDict, cast if TYPE_CHECKING: - from .blocks import BlockUnit + from .blocks import BlockUnit, SegmentUnit from .extractor import Unit from .errors import CacheError +OS_NAME = os.name +MAX_CACHE_SIZE_BYTES = 50 * 1024 * 1024 + class FileStat(TypedDict): mtime_ns: int @@ -50,10 +53,21 @@ class BlockDict(TypedDict): size: int +class SegmentDict(TypedDict): + segment_hash: str + segment_sig: str + filepath: str + qualname: str + start_line: int + end_line: int + size: int + + class CacheEntry(TypedDict): stat: FileStat units: list[UnitDict] blocks: 
list[BlockDict] + segments: list[SegmentDict] class CacheData(TypedDict): @@ -62,14 +76,17 @@ class CacheData(TypedDict): class Cache: - __slots__ = ("data", "load_warning", "path", "secret") - CACHE_VERSION = "1.0" + __slots__ = ("data", "load_warning", "max_size_bytes", "path", "secret") + CACHE_VERSION = "1.1" - def __init__(self, path: str | Path): + def __init__(self, path: str | Path, *, max_size_bytes: int | None = None): self.path = Path(path) self.data: CacheData = {"version": self.CACHE_VERSION, "files": {}} self.secret = self._load_secret() self.load_warning: str | None = None + self.max_size_bytes = ( + MAX_CACHE_SIZE_BYTES if max_size_bytes is None else max_size_bytes + ) def _load_secret(self) -> bytes: """Load or create cache signing secret.""" @@ -85,7 +102,7 @@ def _load_secret(self) -> bytes: self.path.parent.mkdir(parents=True, exist_ok=True) secret_path.write_bytes(secret) # Set restrictive permissions on secret file (Unix only) - if os.name == "posix": + if OS_NAME == "posix": secret_path.chmod(0o600) except OSError: pass @@ -102,6 +119,15 @@ def load(self) -> None: return try: + size = self.path.stat().st_size + if size > self.max_size_bytes: + self.load_warning = ( + "Cache file too large " + f"({size} bytes, max {self.max_size_bytes}); ignoring cache." + ) + self.data = {"version": self.CACHE_VERSION, "files": {}} + return + raw = json.loads(self.path.read_text("utf-8")) stored_sig = raw.get("_signature") @@ -110,7 +136,10 @@ def load(self) -> None: # Verify signature expected_sig = self._sign_data(data) - if stored_sig != expected_sig: + if not ( + isinstance(stored_sig, str) + and hmac.compare_digest(stored_sig, expected_sig) + ): self.load_warning = "Cache signature mismatch; ignoring cache." self.data = {"version": self.CACHE_VERSION, "files": {}} return @@ -129,7 +158,7 @@ def load(self) -> None: self.data = {"version": self.CACHE_VERSION, "files": {}} return - self.data = cast(CacheData, data) + self.data = cast(CacheData, cast(object, data)) self.load_warning = None except (json.JSONDecodeError, ValueError): @@ -159,10 +188,22 @@ def get_file_entry(self, filepath: str) -> CacheEntry | None: if not isinstance(entry, dict): return None - required = {"stat", "units", "blocks"} + required = {"stat", "units", "blocks", "segments"} if not required.issubset(entry.keys()): return None + stat = entry.get("stat") + units = entry.get("units") + blocks = entry.get("blocks") + segments = entry.get("segments") + if not ( + _is_file_stat_dict(stat) + and _is_unit_list(units) + and _is_block_list(blocks) + and _is_segment_list(segments) + ): + return None + return entry def put_file_entry( @@ -171,11 +212,15 @@ def put_file_entry( stat_sig: FileStat, units: list[Unit], blocks: list[BlockUnit], + segments: list[SegmentUnit], ) -> None: self.data["files"][filepath] = { "stat": stat_sig, "units": cast(list[UnitDict], cast(object, [asdict(u) for u in units])), "blocks": cast(list[BlockDict], cast(object, [asdict(b) for b in blocks])), + "segments": cast( + list[SegmentDict], cast(object, [asdict(s) for s in segments]) + ), } @@ -185,3 +230,56 @@ def file_stat_signature(path: str) -> FileStat: "mtime_ns": st.st_mtime_ns, "size": st.st_size, } + + +def _is_file_stat_dict(value: object) -> bool: + if not isinstance(value, dict): + return False + return isinstance(value.get("mtime_ns"), int) and isinstance(value.get("size"), int) + + +def _is_unit_dict(value: object) -> bool: + if not isinstance(value, dict): + return False + string_keys = ("qualname", "filepath", "fingerprint", 
"loc_bucket") + int_keys = ("start_line", "end_line", "loc", "stmt_count") + return _has_typed_fields(value, string_keys=string_keys, int_keys=int_keys) + + +def _is_block_dict(value: object) -> bool: + if not isinstance(value, dict): + return False + string_keys = ("block_hash", "filepath", "qualname") + int_keys = ("start_line", "end_line", "size") + return _has_typed_fields(value, string_keys=string_keys, int_keys=int_keys) + + +def _is_segment_dict(value: object) -> bool: + if not isinstance(value, dict): + return False + string_keys = ("segment_hash", "segment_sig", "filepath", "qualname") + int_keys = ("start_line", "end_line", "size") + return _has_typed_fields(value, string_keys=string_keys, int_keys=int_keys) + + +def _is_unit_list(value: object) -> bool: + return isinstance(value, list) and all(_is_unit_dict(item) for item in value) + + +def _is_block_list(value: object) -> bool: + return isinstance(value, list) and all(_is_block_dict(item) for item in value) + + +def _is_segment_list(value: object) -> bool: + return isinstance(value, list) and all(_is_segment_dict(item) for item in value) + + +def _has_typed_fields( + value: dict[str, object], + *, + string_keys: tuple[str, ...], + int_keys: tuple[str, ...], +) -> bool: + return all(isinstance(value.get(key), str) for key in string_keys) and all( + isinstance(value.get(key), int) for key in int_keys + ) diff --git a/codeclone/cfg.py b/codeclone/cfg.py index 9235a7f..625f1f8 100644 --- a/codeclone/cfg.py +++ b/codeclone/cfg.py @@ -10,9 +10,11 @@ import ast from collections.abc import Iterable +from dataclasses import dataclass from typing import Protocol, cast from .cfg_model import CFG, Block +from .meta_markers import CFG_META_PREFIX __all__ = ["CFG", "CFGBuilder"] @@ -26,17 +28,28 @@ class _TryLike(Protocol): finalbody: list[ast.stmt] +@dataclass(slots=True) +class _LoopContext: + continue_target: Block + break_target: Block + + +def _meta_expr(value: str) -> ast.Expr: + return ast.Expr(value=ast.Name(id=f"{CFG_META_PREFIX}{value}", ctx=ast.Load())) + + # ========================= # CFG Builder # ========================= class CFGBuilder: - __slots__ = ("cfg", "current") + __slots__ = ("_loop_stack", "cfg", "current") def __init__(self) -> None: self.cfg: CFG self.current: Block + self._loop_stack: list[_LoopContext] = [] def build( self, @@ -73,6 +86,12 @@ def _visit(self, stmt: ast.stmt) -> None: self.current.is_terminated = True self.current.add_successor(self.cfg.exit) + case ast.Break(): + self._visit_break(stmt) + + case ast.Continue(): + self._visit_continue(stmt) + case ast.If(): self._visit_if(stmt) @@ -88,7 +107,7 @@ def _visit(self, stmt: ast.stmt) -> None: case ast.Try(): self._visit_try(cast(_TryLike, stmt)) case _ if TryStar is not None and isinstance(stmt, TryStar): - self._visit_try(cast(_TryLike, stmt)) + self._visit_try(cast(_TryLike, cast(object, stmt))) case ast.With() | ast.AsyncWith(): self._visit_with(stmt) @@ -102,14 +121,11 @@ def _visit(self, stmt: ast.stmt) -> None: # ---------- Control Flow ---------- def _visit_if(self, stmt: ast.If) -> None: - self.current.statements.append(ast.Expr(value=stmt.test)) - then_block = self.cfg.create_block() else_block = self.cfg.create_block() after_block = self.cfg.create_block() - self.current.add_successor(then_block) - self.current.add_successor(else_block) + self._emit_condition(stmt.test, then_block, else_block) self.current = then_block self._visit_statements(stmt.body) @@ -126,25 +142,36 @@ def _visit_if(self, stmt: ast.If) -> None: def _visit_while(self, 
stmt: ast.While) -> None: cond_block = self.cfg.create_block() body_block = self.cfg.create_block() + else_block = self.cfg.create_block() if stmt.orelse else None after_block = self.cfg.create_block() self.current.add_successor(cond_block) self.current = cond_block - self.current.statements.append(ast.Expr(value=stmt.test)) - self.current.add_successor(body_block) - self.current.add_successor(after_block) + false_target = else_block if else_block is not None else after_block + self._emit_condition(stmt.test, body_block, false_target) + self._loop_stack.append( + _LoopContext(continue_target=cond_block, break_target=after_block) + ) self.current = body_block self._visit_statements(stmt.body) if not self.current.is_terminated: self.current.add_successor(cond_block) + self._loop_stack.pop() + + if else_block is not None: + self.current = else_block + self._visit_statements(stmt.orelse) + if not self.current.is_terminated: + self.current.add_successor(after_block) self.current = after_block def _visit_for(self, stmt: ast.For | ast.AsyncFor) -> None: iter_block = self.cfg.create_block() body_block = self.cfg.create_block() + else_block = self.cfg.create_block() if stmt.orelse else None after_block = self.cfg.create_block() self.current.add_successor(iter_block) @@ -152,12 +179,24 @@ def _visit_for(self, stmt: ast.For | ast.AsyncFor) -> None: self.current = iter_block self.current.statements.append(ast.Expr(value=stmt.iter)) self.current.add_successor(body_block) - self.current.add_successor(after_block) + self.current.add_successor( + else_block if else_block is not None else after_block + ) + self._loop_stack.append( + _LoopContext(continue_target=iter_block, break_target=after_block) + ) self.current = body_block self._visit_statements(stmt.body) if not self.current.is_terminated: self.current.add_successor(iter_block) + self._loop_stack.pop() + + if else_block is not None: + self.current = else_block + self._visit_statements(stmt.orelse) + if not self.current.is_terminated: + self.current.add_successor(after_block) self.current = after_block @@ -193,19 +232,36 @@ def _visit_try(self, stmt: _TryLike) -> None: self.current.add_successor(try_entry) self.current = try_entry - handlers_blocks = [self.cfg.create_block() for _ in stmt.handlers] + handler_test_blocks = [self.cfg.create_block() for _ in stmt.handlers] + handler_body_blocks = [self.cfg.create_block() for _ in stmt.handlers] else_block = self.cfg.create_block() if stmt.orelse else None final_block = self.cfg.create_block() + for idx, (handler, test_block, body_block) in enumerate( + zip(stmt.handlers, handler_test_blocks, handler_body_blocks, strict=True) + ): + test_block.statements.append(_meta_expr(f"TRY_HANDLER_INDEX:{idx}")) + if handler.type is not None: + type_repr = ast.dump(handler.type, annotate_fields=False) + test_block.statements.append( + _meta_expr(f"TRY_HANDLER_TYPE:{type_repr}") + ) + else: + test_block.statements.append(_meta_expr("TRY_HANDLER_TYPE:BARE")) + test_block.add_successor(body_block) + if idx + 1 < len(handler_test_blocks): + test_block.add_successor(handler_test_blocks[idx + 1]) + else: + test_block.add_successor(final_block) + # Process each statement in try body - # Link each to exception handlers + # Link only statements that can raise to exception handlers for stmt_node in stmt.body: if self.current.is_terminated: break - # Current statement could raise exception - for h_block in handlers_blocks: - self.current.add_successor(h_block) + if _stmt_can_raise(stmt_node) and handler_test_blocks: + 
self.current.add_successor(handler_test_blocks[0]) self._visit(stmt_node) @@ -217,11 +273,8 @@ def _visit_try(self, stmt: _TryLike) -> None: self.current.add_successor(final_block) # Process handlers - for handler, h_block in zip(stmt.handlers, handlers_blocks, strict=True): - self.current = h_block - if handler.type: - self.current.statements.append(ast.Expr(value=handler.type)) - + for handler, body_block in zip(stmt.handlers, handler_body_blocks, strict=True): + self.current = body_block self._visit_statements(handler.body) if not self.current.is_terminated: self.current.add_successor(final_block) @@ -241,23 +294,117 @@ def _visit_try(self, stmt: _TryLike) -> None: def _visit_match(self, stmt: ast.Match) -> None: self.current.statements.append(ast.Expr(value=stmt.subject)) - subject_block = self.current + previous_test_block: Block | None = None after_block = self.cfg.create_block() - for case_ in stmt.cases: - case_block = self.cfg.create_block() - subject_block.add_successor(case_block) + for idx, case_ in enumerate(stmt.cases): + case_test_block = self.cfg.create_block() + case_body_block = self.cfg.create_block() + + if previous_test_block is None: + self.current.add_successor(case_test_block) + else: + previous_test_block.add_successor(case_test_block) - self.current = case_block + case_test_block.statements.append(_meta_expr(f"MATCH_CASE_INDEX:{idx}")) # Record pattern structure pattern_repr = ast.dump(case_.pattern, annotate_fields=False) - self.current.statements.append( - ast.Expr(value=ast.Constant(value=f"PATTERN:{pattern_repr}")) + case_test_block.statements.append( + _meta_expr(f"MATCH_PATTERN:{pattern_repr}") ) + if case_.guard is not None: + case_test_block.statements.append(ast.Expr(value=case_.guard)) + + case_test_block.add_successor(case_body_block) + self.current = case_body_block self._visit_statements(case_.body) if not self.current.is_terminated: self.current.add_successor(after_block) + previous_test_block = case_test_block + + if previous_test_block is not None: + previous_test_block.add_successor(after_block) + self.current = after_block + + def _emit_condition( + self, test: ast.expr, true_block: Block, false_block: Block + ) -> None: + if isinstance(test, ast.BoolOp) and isinstance(test.op, (ast.And, ast.Or)): + self._emit_boolop(test, true_block, false_block) + return + + self.current.statements.append(ast.Expr(value=test)) + self.current.add_successor(true_block) + self.current.add_successor(false_block) + + def _emit_boolop( + self, test: ast.BoolOp, true_block: Block, false_block: Block + ) -> None: + values = test.values + op = test.op + current = self.current + + for idx, value in enumerate(values): + current.statements.append(ast.Expr(value=value)) + is_last = idx == len(values) - 1 + + if isinstance(op, ast.And): + if is_last: + current.add_successor(true_block) + current.add_successor(false_block) + else: + next_block = self.cfg.create_block() + current.add_successor(next_block) + current.add_successor(false_block) + current = next_block + else: + if is_last: + current.add_successor(true_block) + current.add_successor(false_block) + else: + next_block = self.cfg.create_block() + current.add_successor(true_block) + current.add_successor(next_block) + current = next_block + + self.current = current + + def _visit_break(self, stmt: ast.Break) -> None: + self.current.statements.append(stmt) + self.current.is_terminated = True + if self._loop_stack: + self.current.add_successor(self._loop_stack[-1].break_target) + return + 
self.current.add_successor(self.cfg.exit) + + def _visit_continue(self, stmt: ast.Continue) -> None: + self.current.statements.append(stmt) + self.current.is_terminated = True + if self._loop_stack: + self.current.add_successor(self._loop_stack[-1].continue_target) + return + self.current.add_successor(self.cfg.exit) + + +def _stmt_can_raise(stmt: ast.stmt) -> bool: + if isinstance(stmt, ast.Raise): + return True + + for node in ast.walk(stmt): + if isinstance( + node, + ( + ast.Call, + ast.Attribute, + ast.Subscript, + ast.Await, + ast.YieldFrom, + ), + ): + return True + + return False diff --git a/codeclone/cli.py b/codeclone/cli.py index 677dbf8..0ef5832 100644 --- a/codeclone/cli.py +++ b/codeclone/cli.py @@ -1,6 +1,5 @@ from __future__ import annotations -import argparse import os import sys from concurrent.futures import ProcessPoolExecutor, as_completed @@ -17,16 +16,33 @@ TextColumn, TimeElapsedColumn, ) -from rich.table import Table from rich.theme import Theme -from .baseline import Baseline +from . import __version__ +from . import ui_messages as ui +from ._cli_args import build_parser +from ._cli_meta import _build_report_meta as _build_report_meta_impl +from ._cli_meta import _current_python_version as _current_python_version_impl +from ._cli_paths import _validate_output_path as _validate_output_path_impl +from ._cli_paths import expand_path as _expand_path_impl +from ._cli_summary import _build_summary_rows as _build_summary_rows_impl +from ._cli_summary import _build_summary_table as _build_summary_table_impl +from ._cli_summary import _print_summary as _print_summary_impl +from ._cli_summary import _summary_value_style as _summary_value_style_impl +from .baseline import BASELINE_SCHEMA_VERSION, Baseline from .cache import Cache, CacheEntry, FileStat, file_stat_signature -from .errors import CacheError +from .errors import BaselineValidationError, CacheError from .extractor import extract_units_from_source from .html_report import build_html_report from .normalize import NormalizationConfig -from .report import build_block_groups, build_groups, to_json_report, to_text +from .report import ( + build_block_groups, + build_groups, + build_segment_groups, + prepare_segment_report_groups, + to_json_report, + to_text_report, +) from .scanner import iter_py_files, module_name_from_path # Custom theme for Rich @@ -39,10 +55,39 @@ "dim": "dim", } ) -console = Console(theme=custom_theme, width=200) + + +LEGACY_CACHE_PATH = Path("~/.cache/codeclone/cache.json").expanduser() + + +def _make_console(*, no_color: bool) -> Console: + return Console(theme=custom_theme, width=200, no_color=no_color) + + +console = _make_console(no_color=False) MAX_FILE_SIZE = 10 * 1024 * 1024 # 10MB BATCH_SIZE = 100 +_VALID_BASELINE_STATUSES = { + "ok", + "missing", + "legacy", + "invalid", + "mismatch_version", + "mismatch_schema", + "mismatch_python", + "generator_mismatch", + "integrity_missing", + "integrity_failed", + "too_large", +} +_UNTRUSTED_BASELINE_STATUSES = { + "invalid", + "too_large", + "generator_mismatch", + "integrity_missing", + "integrity_failed", +} @dataclass(slots=True) @@ -54,11 +99,12 @@ class ProcessingResult: error: str | None = None units: list[Any] | None = None blocks: list[Any] | None = None + segments: list[Any] | None = None stat: FileStat | None = None def expand_path(p: str) -> Path: - return Path(p).expanduser().resolve() + return _expand_path_impl(p) def process_file( @@ -108,7 +154,7 @@ def process_file( stat = file_stat_signature(filepath) module_name = 
module_name_from_path(root, filepath) - units, blocks = extract_units_from_source( + units, blocks, segments = extract_units_from_source( source=source, filepath=filepath, module_name=module_name, @@ -122,6 +168,7 @@ def process_file( success=True, units=units, blocks=blocks, + segments=segments, stat=stat, ) @@ -136,133 +183,193 @@ def process_file( def print_banner() -> None: console.print( Panel.fit( - "[bold white]CodeClone[/bold white] [dim]v1.2.1[/dim]\n" - "[italic]Architectural duplication detector[/italic]", + ui.banner_title(__version__), border_style="blue", padding=(0, 2), ) ) -def main() -> None: - ap = argparse.ArgumentParser( - prog="codeclone", - description="AST and CFG-based code clone detector for Python.", - formatter_class=argparse.ArgumentDefaultsHelpFormatter, +def _validate_output_path(path: str, *, expected_suffix: str, label: str) -> Path: + return _validate_output_path_impl( + path, + expected_suffix=expected_suffix, + label=label, + console=console, + invalid_message=ui.fmt_invalid_output_extension, ) - # Core Arguments - core_group = ap.add_argument_group("Target") - core_group.add_argument( - "root", - nargs="?", - default=".", - help="Project root directory to scan.", - ) - # Tuning - tune_group = ap.add_argument_group("Analysis Tuning") - tune_group.add_argument( - "--min-loc", - type=int, - default=15, - help="Minimum Lines of Code (LOC) to consider.", - ) - tune_group.add_argument( - "--min-stmt", - type=int, - default=6, - help="Minimum AST statements to consider.", - ) - tune_group.add_argument( - "--processes", - type=int, - default=4, - help="Number of parallel worker processes.", - ) - tune_group.add_argument( - "--cache-dir", - default="~/.cache/codeclone/cache.json", - help="Path to the cache file to speed up subsequent runs.", +def _current_python_version() -> str: + return _current_python_version_impl() + + +def _build_report_meta( + *, + baseline_path: Path, + baseline: Baseline, + baseline_loaded: bool, + baseline_status: str, + cache_path: Path, + cache_used: bool, +) -> dict[str, Any]: + return _build_report_meta_impl( + codeclone_version=__version__, + baseline_path=baseline_path, + baseline=baseline, + baseline_loaded=baseline_loaded, + baseline_status=baseline_status, + cache_path=cache_path, + cache_used=cache_used, ) - # Baseline & CI - ci_group = ap.add_argument_group("Baseline & CI/CD") - ci_group.add_argument( - "--baseline", - default="codeclone.baseline.json", - help="Path to the baseline file (stored in repo).", - ) - ci_group.add_argument( - "--update-baseline", - action="store_true", - help="Overwrite the baseline file with current results.", - ) - ci_group.add_argument( - "--fail-on-new", - action="store_true", - help="Exit with error if NEW clones (not in baseline) are detected.", - ) - ci_group.add_argument( - "--fail-threshold", - type=int, - default=-1, - metavar="MAX_CLONES", - help="Exit with error if total clone groups exceed this number.", - ) - # Output - out_group = ap.add_argument_group("Reporting") - out_group.add_argument( - "--html", - dest="html_out", - metavar="FILE", - help="Generate an HTML report to FILE.", - ) - out_group.add_argument( - "--json", - dest="json_out", - metavar="FILE", - help="Generate a JSON report to FILE.", - ) - out_group.add_argument( - "--text", - dest="text_out", - metavar="FILE", - help="Generate a text report to FILE.", +def _summary_value_style(*, label: str, value: int) -> str: + return _summary_value_style_impl(label=label, value=value) + + +def _build_summary_rows( + *, + 
files_found: int, + files_analyzed: int, + cache_hits: int, + files_skipped: int, + func_clones_count: int, + block_clones_count: int, + segment_clones_count: int, + suppressed_segment_groups: int, + new_clones_count: int, +) -> list[tuple[str, int]]: + return _build_summary_rows_impl( + files_found=files_found, + files_analyzed=files_analyzed, + cache_hits=cache_hits, + files_skipped=files_skipped, + func_clones_count=func_clones_count, + block_clones_count=block_clones_count, + segment_clones_count=segment_clones_count, + suppressed_segment_groups=suppressed_segment_groups, + new_clones_count=new_clones_count, ) - out_group.add_argument( - "--no-progress", - action="store_true", - help="Disable the progress bar (recommended for CI logs).", + + +def _build_summary_table(rows: list[tuple[str, int]]) -> Any: + return _build_summary_table_impl(rows) + + +def _print_summary( + *, + quiet: bool, + files_found: int, + files_analyzed: int, + cache_hits: int, + files_skipped: int, + func_clones_count: int, + block_clones_count: int, + segment_clones_count: int, + suppressed_segment_groups: int, + new_clones_count: int, +) -> None: + _print_summary_impl( + console=console, + quiet=quiet, + files_found=files_found, + files_analyzed=files_analyzed, + cache_hits=cache_hits, + files_skipped=files_skipped, + func_clones_count=func_clones_count, + block_clones_count=block_clones_count, + segment_clones_count=segment_clones_count, + suppressed_segment_groups=suppressed_segment_groups, + new_clones_count=new_clones_count, ) + +def main() -> None: + ap = build_parser(__version__) + + cache_path_from_args = any( + arg in {"--cache-dir", "--cache-path"} + or arg.startswith(("--cache-dir=", "--cache-path=")) + for arg in sys.argv + ) args = ap.parse_args() - print_banner() + if args.ci: + args.fail_on_new = True + args.no_color = True + args.quiet = True + + if args.quiet: + args.no_progress = True + + global console + console = _make_console(no_color=args.no_color) + + if args.max_baseline_size_mb < 0 or args.max_cache_size_mb < 0: + console.print("[error]Size limits must be non-negative integers (MB).[/error]") + sys.exit(1) + + if not args.quiet: + print_banner() try: root_path = Path(args.root).resolve() if not root_path.exists(): - console.print(f"[error]Root path does not exist: {root_path}[/error]") + console.print(ui.ERR_ROOT_NOT_FOUND.format(path=root_path)) sys.exit(1) except Exception as e: - console.print(f"[error]Invalid root path: {e}[/error]") + console.print(ui.ERR_INVALID_ROOT_PATH.format(error=e)) sys.exit(1) - console.print(f"[info]Scanning root:[/info] {root_path}") + if not args.quiet: + console.print(ui.fmt_scanning_root(root_path)) + + html_out_path: Path | None = None + json_out_path: Path | None = None + text_out_path: Path | None = None + if args.html_out: + html_out_path = _validate_output_path( + args.html_out, expected_suffix=".html", label="HTML" + ) + if args.json_out: + json_out_path = _validate_output_path( + args.json_out, expected_suffix=".json", label="JSON" + ) + if args.text_out: + text_out_path = _validate_output_path( + args.text_out, expected_suffix=".txt", label="text" + ) # Initialize Cache cfg = NormalizationConfig() - cache_path = Path(args.cache_dir).expanduser() - cache = Cache(cache_path) + if cache_path_from_args and args.cache_path: + cache_path = Path(args.cache_path).expanduser() + else: + cache_path = root_path / ".cache" / "codeclone" / "cache.json" + if LEGACY_CACHE_PATH.exists(): + try: + legacy_resolved = LEGACY_CACHE_PATH.resolve() + except OSError: + 
legacy_resolved = LEGACY_CACHE_PATH + if legacy_resolved != cache_path: + console.print( + ui.fmt_legacy_cache_warning( + legacy_path=legacy_resolved, new_path=cache_path + ) + ) + cache = Cache(cache_path, max_size_bytes=args.max_cache_size_mb * 1024 * 1024) cache.load() if cache.load_warning: console.print(f"[warning]{cache.load_warning}[/warning]") all_units: list[dict[str, Any]] = [] all_blocks: list[dict[str, Any]] = [] - changed_files_count = 0 + all_segments: list[dict[str, Any]] = [] + files_found = 0 + files_analyzed = 0 + cache_hits = 0 + files_skipped = 0 files_to_process: list[str] = [] def _get_cached_entry( @@ -271,7 +378,7 @@ def _get_cached_entry( try: stat = file_stat_signature(fp) except OSError as e: - return None, None, f"[warning]Skipping file {fp}: {e}[/warning]" + return None, None, ui.fmt_skipping_file(fp, e) cached = cache.get_file_entry(fp) return stat, cached, None @@ -285,7 +392,7 @@ def _safe_process_file(fp: str) -> ProcessingResult | None: args.min_stmt, ) except Exception as e: - console.print(f"[warning]Worker failed: {e}[/warning]") + console.print(ui.fmt_worker_failed(e)) return None def _safe_future_result(future: Any) -> tuple[ProcessingResult | None, str | None]: @@ -295,14 +402,17 @@ def _safe_future_result(future: Any) -> tuple[ProcessingResult | None, str | Non return None, str(e) # Discovery phase - with console.status("[bold green]Discovering Python files...", spinner="dots"): - try: + try: + if args.quiet: for fp in iter_py_files(str(root_path)): + files_found += 1 stat, cached, warn = _get_cached_entry(fp) if warn: console.print(warn) + files_skipped += 1 continue if cached and cached.get("stat") == stat: + cache_hits += 1 all_units.extend( cast( list[dict[str, Any]], @@ -315,11 +425,48 @@ def _safe_future_result(future: Any) -> tuple[ProcessingResult | None, str | Non cast(object, cached.get("blocks", [])), ) ) + all_segments.extend( + cast( + list[dict[str, Any]], + cast(object, cached.get("segments", [])), + ) + ) else: files_to_process.append(fp) - except Exception as e: - console.print(f"[error]Scan failed: {e}[/error]") - sys.exit(1) + else: + with console.status(ui.STATUS_DISCOVERING, spinner="dots"): + for fp in iter_py_files(str(root_path)): + files_found += 1 + stat, cached, warn = _get_cached_entry(fp) + if warn: + console.print(warn) + files_skipped += 1 + continue + if cached and cached.get("stat") == stat: + cache_hits += 1 + all_units.extend( + cast( + list[dict[str, Any]], + cast(object, cached.get("units", [])), + ) + ) + all_blocks.extend( + cast( + list[dict[str, Any]], + cast(object, cached.get("blocks", [])), + ) + ) + all_segments.extend( + cast( + list[dict[str, Any]], + cast(object, cached.get("segments", [])), + ) + ) + else: + files_to_process.append(fp) + except Exception as e: + console.print(ui.ERR_SCAN_FAILED.format(error=e)) + sys.exit(1) total_files = len(files_to_process) failed_files = [] @@ -328,23 +475,28 @@ def _safe_future_result(future: Any) -> tuple[ProcessingResult | None, str | Non if total_files > 0: def handle_result(result: ProcessingResult) -> None: - nonlocal changed_files_count + nonlocal files_analyzed, files_skipped if result.success and result.stat: cache.put_file_entry( result.filepath, result.stat, result.units or [], result.blocks or [], + result.segments or [], ) - changed_files_count += 1 + files_analyzed += 1 if result.units: all_units.extend([asdict(u) for u in result.units]) if result.blocks: all_blocks.extend([asdict(b) for b in result.blocks]) + if result.segments: + 
all_segments.extend([asdict(s) for s in result.segments]) else: + files_skipped += 1 failed_files.append(f"{result.filepath}: {result.error}") def process_sequential(with_progress: bool) -> None: + nonlocal files_skipped if with_progress: with Progress( SpinnerColumn(), @@ -361,20 +513,26 @@ def process_sequential(with_progress: bool) -> None: result = _safe_process_file(fp) if result is not None: handle_result(result) + else: + files_skipped += 1 + failed_files.append(f"{fp}: worker failed") progress.advance(task) else: - console.print(f"[info]Processing {total_files} changed files...[/info]") + if not args.quiet: + console.print(ui.fmt_processing_changed(total_files)) for fp in files_to_process: result = _safe_process_file(fp) if result is not None: handle_result(result) + else: + files_skipped += 1 + failed_files.append(f"{fp}: worker failed") try: with ProcessPoolExecutor(max_workers=args.processes) as executor: if args.no_progress: - console.print( - f"[info]Processing {total_files} changed files...[/info]" - ) + if not args.quiet: + console.print(ui.fmt_processing_changed(total_files)) # Process in batches to manage memory for i in range(0, total_files, BATCH_SIZE): @@ -390,16 +548,22 @@ def process_sequential(with_progress: bool) -> None: ) for fp in batch ] + future_to_fp = { + id(fut): fp for fut, fp in zip(futures, batch, strict=True) + } for future in as_completed(futures): + fp = future_to_fp[id(future)] result, err = _safe_future_result(future) if result is not None: handle_result(result) elif err is not None: - console.print( - "[warning]Failed to process batch item: " - f"{err}[/warning]" - ) + files_skipped += 1 + reason = err + failed_files.append(f"{fp}: {reason}") + console.print(ui.fmt_batch_item_failed(reason)) + else: + files_skipped += 1 else: with Progress( @@ -428,82 +592,164 @@ def process_sequential(with_progress: bool) -> None: ) for fp in batch ] + future_to_fp = { + id(fut): fp + for fut, fp in zip(futures, batch, strict=True) + } for future in as_completed(futures): + fp = future_to_fp[id(future)] result, err = _safe_future_result(future) if result is not None: handle_result(result) elif err is not None: + files_skipped += 1 + reason = err + failed_files.append(f"{fp}: {reason}") # Should rarely happen due to try/except # in process_file. - console.print( - f"[warning]Worker failed: {err}[/warning]" - ) + console.print(ui.fmt_worker_failed(reason)) + else: + files_skipped += 1 progress.advance(task) except (OSError, RuntimeError, PermissionError) as e: - console.print( - "[warning]Parallel processing unavailable, " - f"falling back to sequential: {e}[/warning]" - ) + console.print(ui.fmt_parallel_fallback(e)) process_sequential(with_progress=not args.no_progress) if failed_files: - console.print( - f"\n[warning]⚠ {len(failed_files)} files failed to process:[/warning]" - ) + console.print(ui.fmt_failed_files_header(len(failed_files))) for failure in failed_files[:10]: console.print(f" • {failure}") if len(failed_files) > 10: console.print(f" ... 
and {len(failed_files) - 10} more") # Analysis phase - with console.status("[bold green]Grouping clones...", spinner="dots"): + suppressed_segment_groups = 0 + if args.quiet: func_groups = build_groups(all_units) block_groups = build_block_groups(all_blocks) + segment_groups = build_segment_groups(all_segments) + segment_groups, suppressed_segment_groups = prepare_segment_report_groups( + segment_groups + ) try: cache.save() except CacheError as e: - console.print(f"[warning]Failed to save cache: {e}[/warning]") + console.print(ui.fmt_cache_save_failed(e)) + else: + with console.status(ui.STATUS_GROUPING, spinner="dots"): + func_groups = build_groups(all_units) + block_groups = build_block_groups(all_blocks) + segment_groups = build_segment_groups(all_segments) + segment_groups, suppressed_segment_groups = prepare_segment_report_groups( + segment_groups + ) + try: + cache.save() + except CacheError as e: + console.print(ui.fmt_cache_save_failed(e)) # Reporting func_clones_count = len(func_groups) block_clones_count = len(block_groups) + segment_clones_count = len(segment_groups) # Baseline Logic baseline_path = Path(args.baseline).expanduser().resolve() - # If user didn't specify path and default logic applies, baseline_path - # is now ./codeclone_baseline.json + # If user didn't specify path, the default is ./codeclone.baseline.json. baseline = Baseline(baseline_path) baseline_exists = baseline_path.exists() + baseline_loaded = False + baseline_status = "missing" + baseline_failure_code: int | None = None + baseline_trusted_for_diff = False if baseline_exists: - baseline.load() - if not args.update_baseline and baseline.python_version: - current_version = f"{sys.version_info.major}.{sys.version_info.minor}" - if baseline.python_version != current_version: - console.print( - "[warning]Baseline Python version mismatch.[/warning]\n" - f"Baseline was generated with Python {baseline.python_version}.\n" - f"Current interpreter: Python {current_version}." - ) + try: + baseline.load(max_size_bytes=args.max_baseline_size_mb * 1024 * 1024) + except BaselineValidationError as e: + baseline_status = ( + e.status if e.status in _VALID_BASELINE_STATUSES else "invalid" + ) + if not args.update_baseline: + console.print(ui.fmt_invalid_baseline(e)) if args.fail_on_new: - console.print( - "[error]Baseline checks require the same Python version to " - "ensure deterministic results. 
Please regenerate the baseline " - "using the current interpreter.[/error]" - ) - sys.exit(2) + baseline_failure_code = 2 + else: + console.print(ui.WARN_BASELINE_IGNORED) + else: + baseline_loaded = True + baseline_status = "ok" + baseline_trusted_for_diff = True + if not args.update_baseline: + if baseline.is_legacy_format(): + baseline_status = "legacy" + console.print(ui.fmt_baseline_version_missing(__version__)) + baseline_failure_code = 2 + baseline_trusted_for_diff = False + else: + if baseline.baseline_version != __version__: + assert baseline.baseline_version is not None + baseline_status = "mismatch_version" + console.print( + ui.fmt_baseline_version_mismatch( + baseline_version=baseline.baseline_version, + current_version=__version__, + ) + ) + baseline_failure_code = 2 + baseline_trusted_for_diff = False + if baseline.schema_version != BASELINE_SCHEMA_VERSION: + assert baseline.schema_version is not None + if baseline_status == "ok": + baseline_status = "mismatch_schema" + console.print( + ui.fmt_baseline_schema_mismatch( + baseline_schema=baseline.schema_version, + current_schema=BASELINE_SCHEMA_VERSION, + ) + ) + baseline_failure_code = 2 + baseline_trusted_for_diff = False + if baseline.python_version: + current_version = _current_python_version() + if baseline.python_version != current_version: + if baseline_status == "ok": + baseline_status = "mismatch_python" + console.print( + ui.fmt_baseline_python_mismatch( + baseline_python=baseline.python_version, + current_python=current_version, + ) + ) + if args.fail_on_new: + console.print(ui.ERR_BASELINE_SAME_PYTHON_REQUIRED) + baseline_failure_code = 2 + baseline_trusted_for_diff = False + if baseline_status == "ok": + try: + baseline.verify_integrity() + except BaselineValidationError as e: + status = ( + e.status + if e.status in _VALID_BASELINE_STATUSES + else "invalid" + ) + baseline_status = status + console.print(ui.fmt_invalid_baseline(e)) + baseline_trusted_for_diff = False + if args.fail_on_new: + baseline_failure_code = 2 + else: + console.print(ui.WARN_BASELINE_IGNORED) + if baseline_status in _UNTRUSTED_BASELINE_STATUSES: + baseline_loaded = False + baseline_trusted_for_diff = False else: if not args.update_baseline: - console.print( - "[warning]Baseline file not found at: [bold]" - f"{baseline_path}" - "[/bold][/warning]\n" - "[dim]Comparing against an empty baseline. " - "Use --update-baseline to create it.[/dim]" - ) + console.print(ui.fmt_path(ui.WARN_BASELINE_MISSING, baseline_path)) if args.update_baseline: new_baseline = Baseline.from_groups( @@ -511,92 +757,138 @@ def process_sequential(with_progress: bool) -> None: block_groups, path=baseline_path, python_version=f"{sys.version_info.major}.{sys.version_info.minor}", + baseline_version=__version__, + schema_version=BASELINE_SCHEMA_VERSION, ) new_baseline.save() - console.print(f"[success]✔ Baseline updated:[/success] {baseline_path}") + console.print(ui.fmt_path(ui.SUCCESS_BASELINE_UPDATED, baseline_path)) + baseline = new_baseline + baseline_loaded = True + baseline_status = "ok" + baseline_trusted_for_diff = True # When updating, we don't fail on new, we just saved the new state. # But we might still want to print the summary. 
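+    # Provenance is assembled after baseline resolution so that the HTML,
+    # JSON, and text reports all record the final baseline_status rather
+    # than an intermediate pre-validation state.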
+ report_meta = _build_report_meta( + baseline_path=baseline_path, + baseline=baseline, + baseline_loaded=baseline_loaded, + baseline_status=baseline_status, + cache_path=cache_path.resolve(), + cache_used=cache.load_warning is None, + ) + # Diff - new_func, new_block = baseline.diff(func_groups, block_groups) + baseline_for_diff = ( + baseline if baseline_trusted_for_diff else Baseline(baseline_path) + ) + new_func, new_block = baseline_for_diff.diff(func_groups, block_groups) new_clones_count = len(new_func) + len(new_block) - # Summary Table - table = Table(title="Analysis Summary", border_style="blue") - table.add_column("Metric", style="cyan") - table.add_column("Value", style="bold white") - - table.add_row("Files Processed", str(changed_files_count)) - table.add_row("Total Function Clones", str(func_clones_count)) - table.add_row("Total Block Clones", str(block_clones_count)) - - if baseline_exists: - style = "error" if new_clones_count > 0 else "success" - table.add_row( - "New Clones (vs Baseline)", f"[{style}]{new_clones_count}[/{style}]" - ) - - console.print(table) + _print_summary( + quiet=args.quiet, + files_found=files_found, + files_analyzed=files_analyzed, + cache_hits=cache_hits, + files_skipped=files_skipped, + func_clones_count=func_clones_count, + block_clones_count=block_clones_count, + segment_clones_count=segment_clones_count, + suppressed_segment_groups=suppressed_segment_groups, + new_clones_count=new_clones_count, + ) # Outputs - if args.html_out: - out = Path(args.html_out).expanduser().resolve() + html_report_path: str | None = None + output_notice_printed = False + + def _print_output_notice(message: str) -> None: + nonlocal output_notice_printed + if args.quiet: + return + if not output_notice_printed: + console.print("") + output_notice_printed = True + console.print(message) + + if html_out_path: + out = html_out_path out.parent.mkdir(parents=True, exist_ok=True) out.write_text( build_html_report( func_groups=func_groups, block_groups=block_groups, + segment_groups=segment_groups, + report_meta=report_meta, title="CodeClone Report", context_lines=3, max_snippet_lines=220, ), "utf-8", ) - console.print(f"[info]HTML report saved:[/info] {out}") + html_report_path = str(out) + _print_output_notice(ui.fmt_path(ui.INFO_HTML_REPORT_SAVED, out)) - if args.json_out: - out = Path(args.json_out).expanduser().resolve() + if json_out_path: + out = json_out_path out.parent.mkdir(parents=True, exist_ok=True) out.write_text( - to_json_report(func_groups, block_groups), + to_json_report(func_groups, block_groups, segment_groups, report_meta), "utf-8", ) - console.print(f"[info]JSON report saved:[/info] {out}") + _print_output_notice(ui.fmt_path(ui.INFO_JSON_REPORT_SAVED, out)) - if args.text_out: - out = Path(args.text_out).expanduser().resolve() + if text_out_path: + out = text_out_path out.parent.mkdir(parents=True, exist_ok=True) out.write_text( - "FUNCTION CLONES\n" - + to_text(func_groups) - + "\nBLOCK CLONES\n" - + to_text(block_groups), + to_text_report( + meta=report_meta, + func_groups=func_groups, + block_groups=block_groups, + segment_groups=segment_groups, + ), "utf-8", ) - console.print(f"[info]Text report saved:[/info] {out}") + _print_output_notice(ui.fmt_path(ui.INFO_TEXT_REPORT_SAVED, out)) + + if baseline_failure_code is not None: + sys.exit(baseline_failure_code) # Exit Codes if args.fail_on_new and (new_func or new_block): - console.print("\n[error]❌ FAILED: New code clones detected![/error]") - if new_func: - console.print(f" New Functions: {', 
'.join(sorted(new_func))}") - if new_block: - console.print(f" New Blocks: {', '.join(sorted(new_block))}") + default_report = Path(".cache/codeclone/report.html") + if html_report_path is None and default_report.exists(): + html_report_path = str(default_report) + + console.print(f"\n{ui.FAIL_NEW_TITLE}") + console.print(f"\n{ui.FAIL_NEW_SUMMARY_TITLE}") + console.print(ui.FAIL_NEW_FUNCTION.format(count=len(new_func))) + console.print(ui.FAIL_NEW_BLOCK.format(count=len(new_block))) + if html_report_path: + console.print(f"\n{ui.FAIL_NEW_REPORT_TITLE}") + console.print(f" {html_report_path}") + console.print(f"\n{ui.FAIL_NEW_ACCEPT_TITLE}") + console.print(ui.FAIL_NEW_ACCEPT_COMMAND) + + if args.verbose: + if new_func: + console.print(f"\n{ui.FAIL_NEW_DETAIL_FUNCTION}") + for h in sorted(new_func): + console.print(f"- {h}") + if new_block: + console.print(f"\n{ui.FAIL_NEW_DETAIL_BLOCK}") + for h in sorted(new_block): + console.print(f"- {h}") sys.exit(3) if 0 <= args.fail_threshold < (func_clones_count + block_clones_count): total = func_clones_count + block_clones_count - console.print( - f"\n[error]❌ FAILED: Total clones ({total}) " - f"exceed threshold ({args.fail_threshold})![/error]" - ) + console.print(ui.fmt_fail_threshold(total=total, threshold=args.fail_threshold)) sys.exit(2) if not args.update_baseline and not args.fail_on_new and new_clones_count > 0: - console.print( - "\n[warning]New clones detected but --fail-on-new not set.[/warning]\n" - "Run with --update-baseline to accept them as technical debt." - ) + console.print(ui.WARN_NEW_CLONES_WITHOUT_FAIL) if __name__ == "__main__": diff --git a/codeclone/errors.py b/codeclone/errors.py index c2ab463..11e32b8 100644 --- a/codeclone/errors.py +++ b/codeclone/errors.py @@ -25,3 +25,17 @@ class ValidationError(CodeCloneError): class CacheError(CodeCloneError): """Cache operation failed.""" + + +class BaselineSchemaError(CodeCloneError): + """Baseline file structure is invalid.""" + + +class BaselineValidationError(BaselineSchemaError): + """Baseline validation error with machine-readable status.""" + + __slots__ = ("status",) + + def __init__(self, message: str, *, status: str = "invalid") -> None: + super().__init__(message) + self.status = status diff --git a/codeclone/extractor.py b/codeclone/extractor.py index 02f9730..d0a6236 100644 --- a/codeclone/extractor.py +++ b/codeclone/extractor.py @@ -15,7 +15,7 @@ from contextlib import contextmanager from dataclasses import dataclass -from .blocks import BlockUnit, extract_blocks +from .blocks import BlockUnit, SegmentUnit, extract_blocks, extract_segments from .cfg import CFGBuilder from .errors import ParseError from .fingerprint import bucket_loc, sha1 @@ -70,15 +70,14 @@ def _timeout_handler(_signum: int, _frame: object) -> None: old_limits = resource.getrlimit(resource.RLIMIT_CPU) soft, hard = old_limits - new_soft = ( - min(timeout_s, soft) if soft != resource.RLIM_INFINITY else timeout_s - ) - new_hard = ( - min(timeout_s + 1, hard) - if hard != resource.RLIM_INFINITY - else timeout_s + 1 - ) - resource.setrlimit(resource.RLIMIT_CPU, (new_soft, new_hard)) + hard_ceiling = timeout_s if hard == resource.RLIM_INFINITY else max(1, hard) + if soft == resource.RLIM_INFINITY: + new_soft = min(timeout_s, hard_ceiling) + else: + new_soft = min(timeout_s, soft, hard_ceiling) + # Never lower hard limit: raising it back may be disallowed for + # unprivileged processes and can lead to process termination later. 
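+            # POSIX allows an unprivileged process to lower its limits at
+            # will, but a lowered hard limit cannot be raised again without
+            # elevated privileges (CAP_SYS_RESOURCE on Linux), so only the
+            # soft limit is clamped here and the hard limit passes through.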
+ resource.setrlimit(resource.RLIMIT_CPU, (new_soft, hard)) except Exception: # If resource is unavailable or cannot be set, rely on alarm only. pass @@ -189,7 +188,7 @@ def extract_units_from_source( cfg: NormalizationConfig, min_loc: int, min_stmt: int, -) -> tuple[list[Unit], list[BlockUnit]]: +) -> tuple[list[Unit], list[BlockUnit], list[SegmentUnit]]: try: tree = _parse_with_limits(source, PARSE_TIMEOUT_SECONDS) except SyntaxError as e: @@ -200,6 +199,7 @@ def extract_units_from_source( units: list[Unit] = [] block_units: list[BlockUnit] = [] + segment_units: list[SegmentUnit] = [] for local_name, node in qb.units: start = getattr(node, "lineno", None) @@ -243,4 +243,16 @@ def extract_units_from_source( ) block_units.extend(blocks) - return units, block_units + # Segment-level units (windows within functions, for internal clones) + if loc >= 30 and stmt_count >= 12: + segments = extract_segments( + node, + filepath=filepath, + qualname=qualname, + cfg=cfg, + window_size=6, + max_segments=60, + ) + segment_units.extend(segments) + + return units, block_units, segment_units diff --git a/codeclone/html_report.py b/codeclone/html_report.py index eb23f87..c7ddf36 100644 --- a/codeclone/html_report.py +++ b/codeclone/html_report.py @@ -8,247 +8,62 @@ from __future__ import annotations -import html -import importlib -import itertools -from collections.abc import Iterable -from dataclasses import dataclass -from functools import lru_cache -from typing import Any, NamedTuple, cast - -from codeclone import __version__ -from codeclone.errors import FileProcessingError - +from typing import Any + +from . import __version__ +from ._html_escape import _escape_attr, _escape_html, _meta_display +from ._html_snippets import ( + _FileCache, + _prefix_css, + _pygments_css, + _render_code_block, + _try_pygments, + pairwise, +) from .templates import FONT_CSS_URL, REPORT_TEMPLATE -# ============================ -# Pairwise -# ============================ - - -def pairwise(iterable: Iterable[Any]) -> Iterable[tuple[Any, Any]]: - a, b = itertools.tee(iterable) - next(b, None) - return zip(a, b, strict=False) - - -# ============================ -# Code snippet infrastructure -# ============================ - - -@dataclass(slots=True) -class _Snippet: - filepath: str - start_line: int - end_line: int - code_html: str - - -class _FileCache: - __slots__ = ("_get_lines_impl", "maxsize") - - def __init__(self, maxsize: int = 128) -> None: - self.maxsize = maxsize - # Create a bound method with lru_cache - # We need to cache on the method to have instance-level caching if we wanted - # different caches per instance. But lru_cache on method actually caches - # on the function object (class level) if not careful, - # or we use a wrapper. - # However, for this script, we usually have one reporter. - # To be safe and cleaner, we can use a method that delegates to a cached - # function, OR just use lru_cache on a method (which requires 'self' to be - # hashable, which it is by default id). - # But 'self' changes if we create new instances. - # Let's use the audit's pattern: cache the implementation. 
- - self._get_lines_impl = lru_cache(maxsize=maxsize)(self._read_file_range) - - def _read_file_range( - self, filepath: str, start_line: int, end_line: int - ) -> tuple[str, ...]: - if start_line < 1: - start_line = 1 - if end_line < start_line: - return () - - try: - - def _read_with_errors(errors: str) -> tuple[str, ...]: - lines: list[str] = [] - with open(filepath, encoding="utf-8", errors=errors) as f: - for lineno, line in enumerate(f, start=1): - if lineno < start_line: - continue - if lineno > end_line: - break - lines.append(line.rstrip("\n")) - return tuple(lines) - - try: - return _read_with_errors("strict") - except UnicodeDecodeError: - return _read_with_errors("replace") - except OSError as e: - raise FileProcessingError(f"Cannot read {filepath}: {e}") from e - - def get_lines_range( - self, filepath: str, start_line: int, end_line: int - ) -> tuple[str, ...]: - return self._get_lines_impl(filepath, start_line, end_line) - - class _CacheInfo(NamedTuple): - hits: int - misses: int - maxsize: int | None - currsize: int - - def cache_info(self) -> _CacheInfo: - return cast(_FileCache._CacheInfo, self._get_lines_impl.cache_info()) - - -def _try_pygments(code: str) -> str | None: - try: - pygments = importlib.import_module("pygments") - formatters = importlib.import_module("pygments.formatters") - lexers = importlib.import_module("pygments.lexers") - except Exception: - return None - - highlight = pygments.highlight - formatter_cls = formatters.HtmlFormatter - lexer_cls = lexers.PythonLexer - result = highlight(code, lexer_cls(), formatter_cls(nowrap=True)) - return result if isinstance(result, str) else None - - -def _pygments_css(style_name: str) -> str: - """ - Returns CSS for pygments tokens. Scoped to `.codebox` to avoid leaking styles. - If Pygments is not available or style missing, returns "". - """ - try: - formatters = importlib.import_module("pygments.formatters") - except Exception: - return "" - - try: - formatter_cls = formatters.HtmlFormatter - fmt = formatter_cls(style=style_name) - except Exception: - try: - fmt = formatter_cls() - except Exception: - return "" - - try: - # `.codebox` scope: pygments will emit selectors like `.codebox .k { ... }` - css = fmt.get_style_defs(".codebox") - return css if isinstance(css, str) else "" - except Exception: - return "" - - -def _prefix_css(css: str, prefix: str) -> str: - """ - Prefix every selector block with `prefix `. - Safe enough for pygments CSS which is mostly selector blocks and comments. 
- """ - out_lines: list[str] = [] - for line in css.splitlines(): - stripped = line.strip() - if not stripped: - out_lines.append(line) - continue - if stripped.startswith(("/*", "*", "*/")): - out_lines.append(line) - continue - # Selector lines usually end with `{ - if "{" in line: - # naive prefix: split at "{", prefix selector part - before, after = line.split("{", 1) - sel = before.strip() - if sel: - out_lines.append(f"{prefix} {sel} {{ {after}".rstrip()) - else: - out_lines.append(line) - else: - out_lines.append(line) - return "\n".join(out_lines) - - -def _render_code_block( - *, - filepath: str, - start_line: int, - end_line: int, - file_cache: _FileCache, - context: int, - max_lines: int, -) -> _Snippet: - s = max(1, start_line - context) - e = end_line + context - - if e - s + 1 > max_lines: - e = s + max_lines - 1 - - lines = file_cache.get_lines_range(filepath, s, e) - - numbered: list[tuple[bool, str]] = [] - for lineno, line in enumerate(lines, start=s): - hit = start_line <= lineno <= end_line - numbered.append((hit, f"{lineno:>5} | {line.rstrip()}")) - - raw = "\n".join(text for _, text in numbered) - highlighted = _try_pygments(raw) - - if highlighted is None: - rendered: list[str] = [] - for hit, text in numbered: - cls = "hitline" if hit else "line" - rendered.append(f'
{html.escape(text)}')
-        body = "\n".join(rendered)
-    else:
-        body = highlighted
-
-    return _Snippet(
-        filepath=filepath,
-        start_line=start_line,
-        end_line=end_line,
-        code_html=f'{body}',
-    )
-
 
+__all__ = [
+    "_FileCache",
+    "_prefix_css",
+    "_pygments_css",
+    "_render_code_block",
+    "_try_pygments",
+    "build_html_report",
+    "pairwise",
+]
 
 # ============================
 # HTML report builder
 # ============================
 
 
-def _escape(v: Any) -> str:
-    return html.escape("" if v is None else str(v))
-
-
-def _group_sort_key(items: list[dict[str, Any]]) -> tuple[int, int]:
-    return (
-        -len(items),
-        -max(int(i.get("loc") or i.get("size") or 0) for i in items),
-    )
+def _group_sort_key(items: list[dict[str, Any]]) -> tuple[int]:
+    return (-len(items),)
 
 
 def build_html_report(
     *,
     func_groups: dict[str, list[dict[str, Any]]],
     block_groups: dict[str, list[dict[str, Any]]],
+    segment_groups: dict[str, list[dict[str, Any]]],
+    report_meta: dict[str, Any] | None = None,
     title: str = "CodeClone Report",
    context_lines: int = 3,
     max_snippet_lines: int = 220,
 ) -> str:
     file_cache = _FileCache()
 
-    func_sorted = sorted(func_groups.items(), key=lambda kv: _group_sort_key(kv[1]))
-    block_sorted = sorted(block_groups.items(), key=lambda kv: _group_sort_key(kv[1]))
+    func_sorted = sorted(
+        func_groups.items(), key=lambda kv: (*_group_sort_key(kv[1]), kv[0])
+    )
+    block_sorted = sorted(
+        block_groups.items(), key=lambda kv: (*_group_sort_key(kv[1]), kv[0])
+    )
+    segment_sorted = sorted(
+        segment_groups.items(), key=lambda kv: (*_group_sort_key(kv[1]), kv[0])
+    )
 
-    has_any = bool(func_sorted) or bool(block_sorted)
+    has_any = bool(func_sorted) or bool(block_sorted) or bool(segment_sorted)
 
     # Pygments CSS (scoped). Use modern GitHub-like styles when available.
     # We scope per theme to support toggle without reloading.
@@ -265,64 +80,60 @@
     # ============================
     # Icons (Inline SVG)
     # ============================
-    ICON_SEARCH = (
-        ''
-        ''
-        ''
-        ""
-    )
-    ICON_X = (
-        ''
-        ''
-        ''
-        ""
-    )
-    ICON_CHEV_DOWN = (
-        ''
-        ''
-        ""
-    )
-    # ICON_CHEV_RIGHT = (
-    #     ''
-    #     ''
-    #     ""
-    # )
-    ICON_THEME = (
-        ''
-        ''
-        ""
-    )
-    ICON_CHECK = (
-        ''
-        ''
-        ""
-    )
-    ICON_PREV = (
-        ''
-        ''
-        ""
-    )
-    ICON_NEXT = (
-        ''
-        ''
-        ""
-    )
+    def _svg_icon(size: int, stroke_width: str, body: str) -> str:
+        return (
+            f''
+            f"{body}"
+        )
+
+    ICONS = {
+        "search": _svg_icon(
+            16,
+            "2.5",
+            ''
+            '',
+        ),
+        "clear": _svg_icon(
+            16,
+            "2.5",
+            ''
+            '',
+        ),
+        "chev_down": _svg_icon(
+            16,
+            "2.5",
+            '',
+        ),
+        # ICON_CHEV_RIGHT = (
+        #     ''
+        #     ''
+        #     ""
+        # )
+        "theme": _svg_icon(
+            16,
+            "2",
+            '',
+        ),
+        "check": _svg_icon(
+            48,
+            "2",
+            '',
+        ),
+        "prev": _svg_icon(
+            16,
+            "2",
+            '',
+        ),
+        "next": _svg_icon(
+            16,
+            "2",
+            '',
+        ),
+    }
 
     # ----------------------------
     # Section renderer
     # ----------------------------
@@ -341,16 +152,16 @@ def render_section(
     out: list[str] = [
         f'',
         '',
-        f"{_escape(section_title)} "
+        f"{_escape_html(section_title)} "
         f''
         f"{len(groups)} groups",
         f"""
@@ -970,8 +1377,21 @@
 v${version}