From a4c889338316887de7400cdf99434035ed266c50 Mon Sep 17 00:00:00 2001
From: Ahmed Farghal <me@asoli.dev>
Date: Wed, 22 Apr 2026 13:33:13 +0100
Subject: [PATCH] [VQueues] Introducing UserLimiter

---
 Cargo.lock                                    |    2 +
 Cargo.toml                                    |    5 +-
 crates/limiter/src/lib.rs                     |    9 +-
 crates/limiter/src/rule.rs                    |    5 +
 crates/limiter/src/rule_store.rs              |  128 ++
 crates/types/src/lib.rs                       |    7 +
 crates/vqueues/Cargo.toml                     |    1 +
 crates/vqueues/src/scheduler/eligible.rs      |    6 +
 .../vqueues/src/scheduler/resource_manager.rs |   97 +-
 .../src/scheduler/resource_manager/limiter.rs |   31 -
 .../src/scheduler/resource_manager/permit.rs  |   14 +
 .../resource_manager/user_limiter.rs          | 1225 +++++++++++++++++
 util/string/src/restricted_value.rs           |    7 +
 workspace-hack/Cargo.toml                     |    2 +
 14 files changed, 1483 insertions(+), 56 deletions(-)
 delete mode 100644 crates/vqueues/src/scheduler/resource_manager/limiter.rs
 create mode 100644 crates/vqueues/src/scheduler/resource_manager/user_limiter.rs
diff --git a/Cargo.lock b/Cargo.lock
index f136631bbe..ee48207986 100644
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -8457,6 +8457,7 @@ dependencies = [
 name = "restate-vqueues"
 version = "1.6.3-dev"
 dependencies = [
+ "arrayvec",
  "bilrost",
  "derive_more",
  "gardal",
@@ -8582,6 +8583,7 @@ version = "0.0.1"
 dependencies = [
  "adaptive-timeout",
  "ahash",
+ "arrayvec",
  "arrow",
  "arrow-array",
  "arrow-cast",
diff --git a/Cargo.toml b/Cargo.toml
index c81f1d0835..850c14656c 100644
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -107,17 +107,18 @@ adaptive-timeout = { version = "0.0.1-alpha.4" }
 ahash = "0.8.12"
 anyhow = "1.0.100"
 arc-swap = "1.8"
+arrayvec = { version = "0.7" }
 arrow = { version = "57.1.0", default-features = false }
 assert2 = "0.3.16"
 async-channel = "2.5.0"
 async-trait = "0.1.89"
-axum = { version = "0.8.8", default-features = false }
 aws-config = "1.8.12"
-aws-sdk-dynamodb = { version = "1.101.0", default-features = false, features = ["behavior-version-latest", "rt-tokio", "default-https-client"] }
 aws-credential-types = "1.2.11"
+aws-sdk-dynamodb = { version = "1.101.0", default-features = false, features = ["behavior-version-latest", "rt-tokio", "default-https-client"] }
 aws-smithy-async = { version = "1.2.7", default-features = false }
 aws-smithy-runtime-api = "1.9.3"
 aws-smithy-types = "1.3.5"
+axum = { version = "0.8.8", default-features = false }
 base64 = "0.22"
 bilrost = { version = "0.1014", default-features = false, features = ["std", "auto-optimize", "derive"] }
 bincode = { version = "2.0.1", default-features = false }
diff --git a/crates/limiter/src/lib.rs b/crates/limiter/src/lib.rs
index c60681a5fa..037ad725f6 100644
--- a/crates/limiter/src/lib.rs
+++ b/crates/limiter/src/lib.rs
@@ -43,6 +43,11 @@ mod key;
 mod rule;
 mod rule_store;
 
+// Re-exports
+pub use key::LimitKey;
+pub use rule::{Pattern, RuleHandle, RulePattern};
+pub use rule_store::{Limit, Rules, StructuredLimits};
+
 /// Represents the hierarchy level of counters or rules
 ///
 /// This enum is used throughout the limiter to identify which level
@@ -91,7 +96,3 @@ impl std::fmt::Display for Level {
         }
     }
 }
-
-pub use key::LimitKey;
-pub use rule::RulePattern;
-pub use rule_store::{Limit, Rules, StructuredLimits};
diff --git a/crates/limiter/src/rule.rs b/crates/limiter/src/rule.rs
index 3da5efc224..e7e3263bb5 100644
--- a/crates/limiter/src/rule.rs
+++ b/crates/limiter/src/rule.rs
@@ -181,6 +181,11 @@ impl<S: StringLike> Pattern<S> {
         }
     }
 
+    /// A pattern is never empty (wildcards have len 1, exact values are non-empty).
+    pub fn is_empty(&self) -> bool {
+        false
+    }
+
     /// Matches the input and returns a ranking value's most signifcant bit
     fn rank(&self, input: &str, level: Level) -> Option<u8> {
         let msb = Level::COUNT - level as usize;
diff --git a/crates/limiter/src/rule_store.rs b/crates/limiter/src/rule_store.rs
index 0dcb862c0d..e76a2ae6fb 100644
--- a/crates/limiter/src/rule_store.rs
+++ b/crates/limiter/src/rule_store.rs
@@ -41,6 +41,14 @@ impl<V> StructuredLimits<V> {
             l2: Limit::Undefined,
         }
     }
+
+    pub fn limit_at(&self, level: Level) -> &Limit<V> {
+        match level {
+            Level::Scope => &self.scope,
+            Level::Level1 => &self.l1,
+            Level::Level2 => &self.l2,
+        }
+    }
 }
 
 impl<V> Default for StructuredLimits<V> {
@@ -149,6 +157,7 @@ impl<S: StringLike, V> Rules<S, V> {
         }
         store
     }
+
     /// Add a rule to the store.
     pub fn add_rule(&mut self, pattern: RulePattern<S>, limit: V) {
         let level = pattern.level();
@@ -162,6 +171,58 @@ impl<S: StringLike, V> Rules<S, V> {
         }
     }
 
+    /// Finds the rule with the matching pattern and updates its limit in-place
+    /// without invalidating rule handles. If no matching rule exists, inserts a
+    /// new one.
+    pub fn upsert_rule(&mut self, pattern: RulePattern<S>, limit: V) -> RuleHandle {
+        if let Some(handle) = self.find_rule(&pattern) {
+            self.limits.insert(handle, limit);
+            handle
+        } else {
+            let level = pattern.level();
+            let handle = self.rules.insert(pattern);
+            self.limits.insert(handle, limit);
+            match level {
+                Level::Scope => self.scope_rules.push(handle),
+                Level::Level1 => self.l1_rules.push(handle),
+                Level::Level2 => self.l2_rules.push(handle),
+            }
+            handle
+        }
+    }
+
+    /// Removes the rule matching the given pattern.
+    /// Returns the handle and old limit if found.
+    pub fn remove_rule(&mut self, pattern: &RulePattern<S>) -> Option<(RuleHandle, V)> {
+        let handle = self.find_rule(pattern)?;
+
+        let level_rules = match pattern.level() {
+            Level::Scope => &mut self.scope_rules,
+            Level::Level1 => &mut self.l1_rules,
+            Level::Level2 => &mut self.l2_rules,
+        };
+        if let Some(pos) = level_rules.iter().position(|&h| h == handle) {
+            level_rules.swap_remove(pos);
+        }
+
+        self.rules.remove(handle);
+        let limit = self.limits.remove(handle)?;
+        Some((handle, limit))
+    }
+
+    /// Finds an existing rule handle by matching its pattern.
+    fn find_rule(&self, pattern: &RulePattern<S>) -> Option<RuleHandle> {
+        let level_rules = match pattern.level() {
+            Level::Scope => &self.scope_rules,
+            Level::Level1 => &self.l1_rules,
+            Level::Level2 => &self.l2_rules,
+        };
+        level_rules
+            .iter()
+            .copied()
+            .find(|&h| self.rules.get(h).is_some_and(|p| *p == *pattern))
+    }
+
     /// Clear all rules.
     pub fn clear(&mut self) {
         self.scope_rules.clear();
@@ -320,6 +381,73 @@ mod tests {
         assert!(matches!(result.l1, Limit::Undefined));
     }
 
+    #[test]
+    fn upsert_inserts_new_and_updates_existing() {
+        let mut store = store_with_rules(&[("*", 1000), ("scope1/*", 100)]);
+        assert_eq!(store.scope_rules.len(), 1);
+        assert_eq!(store.l1_rules.len(), 1);
+
+        // Upsert existing scope rule: updates limit, same handle
+        let pattern: RulePattern<String> = "*".parse().unwrap();
+        let h1 = store.find_rule(&pattern).unwrap();
+        let h2 = store.upsert_rule(pattern, 2000);
+        assert_eq!(h1, h2);
+        assert_eq!(store.scope_rules.len(), 1);
+        assert_eq!(*store.get_limit(h2).unwrap(), 2000);
+
+        // Upsert new L2 rule: inserts
+        let pattern: RulePattern<String> = "scope1/*/tenant1".parse().unwrap();
+        let h3 = store.upsert_rule(pattern, 10);
+        assert_eq!(store.l2_rules.len(), 1);
+        assert_eq!(*store.get_limit(h3).unwrap(), 10);
+
+        // Lookups reflect the updated and new rules
+        let result = store.lookup("scope1", &LimitKey::None);
+        assert!(matches!(result.scope, Limit::Defined(_, 2000)));
+        let key: LimitKey<String> = "foo/tenant1".parse().unwrap();
+        let result = store.lookup("scope1", &key);
+        assert!(matches!(result.l2, Limit::Defined(_, 10)));
+    }
+
+    #[test]
+    fn remove_rule_removes_and_returns_old_limit() {
+        let mut store = store_with_rules(&[
+            ("*", 1000),
+            ("scope1", 500),
+            ("scope1/*", 100),
+            ("scope1/tenant1", 50),
+        ]);
+        assert_eq!(store.scope_rules.len(), 2);
+        assert_eq!(store.l1_rules.len(), 2);
+
+        // Remove an existing scope rule
+        let pattern: RulePattern<String> = "scope1".parse().unwrap();
+        let (handle, limit) = store.remove_rule(&pattern).unwrap();
+        assert_eq!(limit, 500);
+        assert_eq!(store.scope_rules.len(), 1);
+        assert!(store.rules.get(handle).is_none());
+        assert!(store.limits.get(handle).is_none());
+
+        // Lookups fall back to wildcard now
+        let result = store.lookup("scope1", &LimitKey::None);
+        assert!(matches!(result.scope, Limit::Defined(_, 1000)));
+
+        // Remove a non-existent rule returns None
+        let pattern: RulePattern<String> = "nonexistent".parse().unwrap();
+        assert!(store.remove_rule(&pattern).is_none());
+
+        // Remove an L1 rule
+        let pattern: RulePattern<String> = "scope1/tenant1".parse().unwrap();
+        let (_, limit) = store.remove_rule(&pattern).unwrap();
+        assert_eq!(limit, 50);
+        assert_eq!(store.l1_rules.len(), 1);
+
+        // Lookups fall back to wildcard L1
+        let key: LimitKey<String> = "tenant1".parse().unwrap();
+        let result = store.lookup("scope1", &key);
+        assert!(matches!(result.l1, Limit::Defined(_, 100)));
+    }
+
     #[test]
     fn lookup_only_populates_matching_depth() {
         let store = store_with_rules(&[("*", 1000), ("*/*", 100), ("*/*/*", 10)]);
diff --git a/crates/types/src/lib.rs b/crates/types/src/lib.rs
index 8df2b343a6..2930ad1c57 100644
--- a/crates/types/src/lib.rs
+++ b/crates/types/src/lib.rs
@@ -212,6 +212,13 @@ impl Scope {
     }
 }
 
+// Needed for hashbrown's entry_ref API to lazily convert the key reference on insert.
+impl From<&Scope> for Scope {
+    fn from(value: &Scope) -> Self {
+        value.clone()
+    }
+}
+
 impl AsRef<str> for Scope {
     #[inline]
     fn as_ref(&self) -> &str {
diff --git a/crates/vqueues/Cargo.toml b/crates/vqueues/Cargo.toml
index 42782cda5e..d852ade86e 100644
--- a/crates/vqueues/Cargo.toml
+++ b/crates/vqueues/Cargo.toml
@@ -24,6 +24,7 @@ restate-storage-api = { workspace = true }
 restate-types = { workspace = true }
 restate-util-string = { workspace = true }
 
+arrayvec = { workspace = true }
 bilrost = { workspace = true, features = ["smallvec"] }
 derive_more = { workspace = true, features = ["debug", "is_variant"] }
 gardal = { workspace = true, features = ["tokio"] }
diff --git a/crates/vqueues/src/scheduler/eligible.rs b/crates/vqueues/src/scheduler/eligible.rs
index 0201f449aa..fa72c57f54 100644
--- a/crates/vqueues/src/scheduler/eligible.rs
+++ b/crates/vqueues/src/scheduler/eligible.rs
@@ -236,6 +236,12 @@ impl EligibilityTracker {
         }
     }
 
+    pub fn wake_up_queues(&mut self, vqueues: impl IntoIterator<Item = VQueueHandle>) -> bool {
+        vqueues.into_iter().fold(false, |wake_up, vqueue| {
+            wake_up | self.wake_up_queue(vqueue)
+        })
+    }
+
     /// returns true if the scheduler should be woken up
     pub fn wake_up_queue(&mut self, vqueue: VQueueHandle) -> bool {
         if let Some(state) = self.states.entry(vqueue) {
diff --git a/crates/vqueues/src/scheduler/resource_manager.rs b/crates/vqueues/src/scheduler/resource_manager.rs
index 965f30ce23..1bec778ee0 100644
--- a/crates/vqueues/src/scheduler/resource_manager.rs
+++ b/crates/vqueues/src/scheduler/resource_manager.rs
@@ -11,9 +11,9 @@
 mod invoker;
 mod invoker_memory;
 mod invoker_throttle;
-mod limiter;
 mod locks;
 mod permit;
+mod user_limiter;
 
 pub use self::permit::{PermitBuilder, ReservedResources};
 
@@ -25,19 +25,21 @@ use tokio::sync::mpsc;
 use tracing::trace;
 
 use restate_futures_util::concurrency::Concurrency;
+use restate_limiter::{Level, LimitKey, RuleHandle};
 use restate_memory::{MemoryPool, NonZeroByteCount};
 use restate_storage_api::StorageError;
 use restate_storage_api::lock_table::LoadLocks;
 use restate_storage_api::vqueue_table::{EntryKey, EntryMetadata};
 use restate_types::vqueues::EntryKind;
 use restate_types::{LockName, Scope};
+use restate_util_string::ReString;
 
 use self::invoker::InvokerConcurrencyLimiter;
 use self::invoker_memory::InvokerMemoryLimiter;
 use self::invoker_throttle::InvokerThrottlingLimiter;
-use self::limiter::UserLimiter;
 use self::locks::Locks;
 use self::permit::{ProvisionalPermit, UserPermitKind};
+use self::user_limiter::UserLimiter;
 use super::VQueueHandle;
 use super::eligible::EligibilityTracker;
 use super::queue_meta::VQueueMetaLite;
@@ -53,9 +55,7 @@ pub struct ResourceManager {
     invoker_concurrency: InvokerConcurrencyLimiter,
     invoker_throttling: InvokerThrottlingLimiter,
     invoker_memory: InvokerMemoryLimiter,
-    #[allow(dead_code)]
     user_limiter: UserLimiter,
-    // todo: counters.
     rx: mpsc::UnboundedReceiver<ResourceManagerUpdate>,
     // We need to keep this alive to:
     // - Keep the receiver alive even if we don't have any resource permits handed out
@@ -77,13 +77,22 @@ pub enum ResourceKind {
     InvokerMemory,
     /// Waiting for deployment-level concurrency tokens to be available
     DeploymentConcurrency,
-    /// Waiting for user-defined concurrency to be acquired
-    LimitKeyConcurrency,
+    /// Waiting for user-defined concurrency to be acquired.
+    /// Carries routing info so the eligibility tracker can return it for waiter removal.
+    LimitKeyConcurrency {
+        scope: Scope,
+        limit_key: LimitKey<ReString>,
+        blocked_level: Level,
+        /// Handle to the blocking rule. Resolve via the rules store for display.
+        /// May be stale if the rule was removed since blocking.
+        blocked_rule: Option<RuleHandle>,
+    },
 }
 
+#[allow(dead_code)]
 enum ResourceManagerUpdate {
     PermitReleased(SmallVec<[UserPermitKind; 1]>),
-    // todo: RulesUpdated
+    RulesUpdated(user_limiter::RuleUpdate),
 }
 
 pub(super) enum AcquireOutcome {
@@ -107,7 +116,7 @@ impl ResourceManager {
             invoker_concurrency: InvokerConcurrencyLimiter::new(concurrency_limiter),
             invoker_throttling: InvokerThrottlingLimiter::new(global_throttling),
             invoker_memory: InvokerMemoryLimiter::new(memory_pool, initial_invocation_memory),
-            user_limiter: UserLimiter::default(),
+            user_limiter: UserLimiter::create(),
             locks,
             rx,
             tx: _tx,
@@ -130,7 +139,15 @@ impl ResourceManager {
                 self.invoker_memory.remove_from_waiters(handle);
             }
             ResourceKind::DeploymentConcurrency => todo!(),
-            ResourceKind::LimitKeyConcurrency => todo!(),
+            ResourceKind::LimitKeyConcurrency {
+                scope,
+                limit_key,
+                blocked_level,
+                ..
+            } => {
+                self.user_limiter
+                    .remove_from_waiters(handle, scope, limit_key, *blocked_level);
+            }
         }
     }
 
@@ -167,16 +184,19 @@ impl ResourceManager {
 
         let mut wake_up = false;
         // Release the lock if we have one held
-        if let Some(lock) = permit.lock {
-            wake_up |= self.release_lock(eligible, &lock.scope, &lock.lock_name);
+        if let Some(lock) = permit.lock
+            && let Some(queues) = self.locks.release_lock(&lock.scope, &lock.lock_name)
+        {
+            wake_up |= eligible.wake_up_queues(queues);
         }
 
-        // 1. reclaim resources
-        // 2. collect the vqueues that need to be woken up
         for resource in permit.resources {
             match resource {
-                UserPermitKind::LimitKeyConcurrency(_scope, _limit_key) => {
-                    todo!("pending implementation of hierarchical counters")
+                UserPermitKind::LimitKeyConcurrency(scope, limit_key) => {
+                    let woken = self
+                        .user_limiter
+                        .release_action_concurrency(&scope, &limit_key);
+                    wake_up |= eligible.wake_up_queues(woken);
                 }
             }
         }
@@ -220,6 +240,40 @@ impl ResourceManager {
                 }
             }
 
+            // unscoped entries cannot acquire user limits
+            if let Some(scope) = meta.scope() {
+                let capacity = self
+                    .user_limiter
+                    .check_concurrency_capacity(scope, meta.limit_key());
+                if let Some((blocked_level, blocked_rule)) = capacity.narrowest_blocked() {
+                    trace!(
+                        %scope,
+                        limit_key = %meta.limit_key(),
+                        blocked_at = %blocked_level,
+                        details = %capacity.display(&self.user_limiter),
+                        "User concurrency limit reached",
+                    );
+                    self.user_limiter.add_to_waiters(
+                        vqueue,
+                        scope,
+                        meta.limit_key(),
+                        blocked_level,
+                    );
+                    return AcquireOutcome::BlockedOn(ResourceKind::LimitKeyConcurrency {
+                        scope: scope.clone(),
+                        limit_key: meta.limit_key().clone(),
+                        blocked_level,
+                        blocked_rule,
+                    });
+                }
+
+                // Stage the permit — counters are incremented in secure()
+                provisional.add_permit(UserPermitKind::LimitKeyConcurrency(
+                    scope.clone(),
+                    meta.limit_key().clone(),
+                ));
+            }
+
             // All user requirements are satisfied.
             current_permit.set_user_permit(provisional.secure(self));
         }
@@ -267,16 +321,21 @@ impl ResourceManager {
         while let Poll::Ready(Some(update)) = self.rx.poll_recv(cx) {
             match update {
                 ResourceManagerUpdate::PermitReleased(resources) => {
-                    // 1. reclaim resources
-                    // 2. collect the vqueues that need to be woken up
                     for resource in resources {
                         match resource {
-                            UserPermitKind::LimitKeyConcurrency(_scope, _limit_key) => {
-                                todo!("pending implementation of hierarchical counters")
+                            UserPermitKind::LimitKeyConcurrency(scope, limit_key) => {
+                                let woken = self
+                                    .user_limiter
+                                    .release_action_concurrency(&scope, &limit_key);
+                                eligible.wake_up_queues(woken);
                             }
                         }
                     }
                 }
+                ResourceManagerUpdate::RulesUpdated(update) => {
+                    let woken = self.user_limiter.apply_rule_update(update);
+                    eligible.wake_up_queues(woken);
+                }
             }
         }
 
diff --git a/crates/vqueues/src/scheduler/resource_manager/limiter.rs b/crates/vqueues/src/scheduler/resource_manager/limiter.rs
deleted file mode 100644
index 9e479434aa..0000000000
--- a/crates/vqueues/src/scheduler/resource_manager/limiter.rs
+++ /dev/null
@@ -1,31 +0,0 @@
-// Copyright (c) 2023 - 2026 Restate Software, Inc., Restate GmbH.
-// All rights reserved.
-//
-// Use of this software is governed by the Business Source License
-// included in the LICENSE file.
-//
-// As of the Change Date specified in that file, in accordance with
-// the Business Source License, use of this software will be governed
-// by the Apache License, Version 2.0.
-
-#![allow(dead_code)]
-// todo: Implementation comes in a later stage
-
-use std::num::NonZeroU64;
-
-use restate_limiter::Rules;
-use restate_util_string::ReString;
-
-// This lives here temporarily until it finds a proper home
-#[derive(Default, Clone)]
-pub struct UserLimits {
-    // None means unlimited
-    action_concurrency: Option<NonZeroU64>,
-}
-
-#[allow(dead_code)]
-#[derive(Default)]
-pub struct UserLimiter {
-    /// User defined limits
-    user_limits: Rules<ReString, UserLimits>,
-}
diff --git a/crates/vqueues/src/scheduler/resource_manager/permit.rs b/crates/vqueues/src/scheduler/resource_manager/permit.rs
index 1bb37096e9..20c4fa2452 100644
--- a/crates/vqueues/src/scheduler/resource_manager/permit.rs
+++ b/crates/vqueues/src/scheduler/resource_manager/permit.rs
@@ -163,6 +163,8 @@ impl ProvisionalPermit {
         self.lock = Some(CanonicalLock { scope, lock_name });
     }
 
+    /// Atomically acquires all staged resources. This is the only place where state
+    /// mutations happen — the check phase leading up to this must be side-effect free.
     pub(crate) fn secure(self, resource_manager: &mut ResourceManager) -> UserPermit {
         if let Some(lock) = self.lock.as_ref() {
             resource_manager
@@ -170,6 +172,18 @@ impl ProvisionalPermit {
                 .acquire_lock(lock.scope.clone(), lock.lock_name.clone());
         }
 
+        for resource in &self.resources {
+            match resource {
+                UserPermitKind::LimitKeyConcurrency(scope, limit_key) => {
+                    resource_manager.user_limiter.increment_all(
+                        scope,
+                        limit_key,
+                        super::user_limiter::LimitKind::Concurrency,
+                    );
+                }
+            }
+        }
+
         UserPermit {
             lock: self.lock,
             resources: self.resources,
diff --git a/crates/vqueues/src/scheduler/resource_manager/user_limiter.rs b/crates/vqueues/src/scheduler/resource_manager/user_limiter.rs
new file mode 100644
index 0000000000..0a5d1af961
--- /dev/null
+++ b/crates/vqueues/src/scheduler/resource_manager/user_limiter.rs
@@ -0,0 +1,1225 @@
+// Copyright (c) 2023 - 2026 Restate Software, Inc., Restate GmbH.
+// All rights reserved.
+//
+// Use of this software is governed by the Business Source License
+// included in the LICENSE file.
+//
+// As of the Change Date specified in that file, in accordance with
+// the Business Source License, use of this software will be governed
+// by the Apache License, Version 2.0.
+
+#![allow(clippy::doc_overindented_list_items)]
+//! # Background
+//!
+//! For each vqueue that has scope+limit-key, we track its usage via a set of counters in [`Usage`].
+//! Counters are organized in a trie-like structure, scope->level1->level2. In the case of
+//! concurrency limiting, they track the number of concurrently running invocations (invocations
+//! in the same scope+limit-key in the run stage of inbox across all vqueues within the same scope).
+//!
+//! Permit acquisition is a two-phase process: first, capacity is checked at all applicable levels
+//! without side effects. If all levels have capacity, the permit is staged in a
+//! [`ProvisionalPermit`] and later secured — this is the only point where counters are
+//! incremented and locks are acquired (see [`ProvisionalPermit::secure`]).
+//!
+//! When a permit is released, we decrement the corresponding usage counters on the corresponding
+//! (scope, scope.level1, scope.level1.level2) counters, but we also need to figure out if we have
+//! queues that are waiting for capacity and that can be woken up as a result of this release.
+//!
+//! Consequently, we need to keep track of which vqueues can be woken up when a counter is released,
+//! to do that, let's look at an example.
+//!
+//! Consider the following scenario:
+//! Rules:
+//!   -  scope1/*/tenant1 = 10 (10 limit for concurrent invocations) for l2=tenant1
+//!   -  * = 100   each scope gets a maximum of 100 concurrent invocations
+//!
+//! We have the following running invocations already:
+//!   - x10 invocations with scope1/foo/tenant1 (scope=scope1, limit-key=foo/tenant1)
+//!        counters: scope1, scope1.foo, scope1.foo.tenant1
+//!   - x9 invocations with scope1/bar/tenant1 (scope=scope1, limit-key=bar/tenant1)
+//!        counters: scope1, scope1.bar, scope1.bar.tenant1
+//!   - x1 invocation with scope1/bar (scope=scope1, limit-key=bar)
+//!        counters: scope1, scope1.bar
+//!   - x80 invocations with scope1   (scope=scope1, limit-key=None)
+//!        counters: scope1
+//!
+//! This results in the following state of counters:
+//!   - scope1.foo.tenant1 = 10
+//!   - scope1.foo = 10
+//!   - scope1.bar.tenant1 = 9
+//!   - scope1.bar = 10        (remember that 1 invocation has scope/l1 defined with scope1/bar)
+//!   - scope1 = 100           (sum of all: 10 + 9 + 1 + 80)
+//!
+//! Now, let's walk through a journey of some vqueues trying to acquire new permits.
+//!  - inv1: scope1  (scope=scope1, limit-key=None)
+//!      matching rules:
+//!          * = 100
+//!      matching counters:
+//!          scope1 = 100
+//!      status: BLOCKED on Level=Scope.
+//!
+//!  - inv2: scope1/asoli (scope=scope1, limit-key=asoli)
+//!      matching rules:
+//!          * = 100
+//!      matching counters:
+//!          scope1 = 100     (BLOCKED, on rule *=100)
+//!          scope1.asoli = 0 (allowed, no rule match means unlimited)
+//!
+//!  - inv3: scope1/foo (scope=scope1, limit-key=foo)
+//!      matching rules:
+//!          * = 100
+//!      matching counters:
+//!          scope1 = 100     (BLOCKED, on rule *=100)
+//!          scope1.foo = 10  (allowed, no rule match means unlimited)
+//!
+//!  - inv4: scope1/bar/tenant1 (scope=scope1, limit-key=bar/tenant1)
+//!          * = 100
+//!          scope1/*/tenant1 = 10
+//!      matching counters:
+//!          scope1 = 100      (BLOCKED, on rule *=100)
+//!          scope1.bar = 10   (allowed, no rule match means unlimited)
+//!          scope1.bar.tenant1 = 9  (allowed, on rule scope1/*/tenant1)
+//!
+//!  - inv5: scope1/foo/tenant1 (scope=scope1, limit-key=foo/tenant1)
+//!          * = 100
+//!          scope1/*/tenant1 = 10
+//!      matching counters:
+//!          scope1 = 100      (BLOCKED, on rule *=100)
+//!          scope1.foo = 10   (allowed, no rule match means unlimited)
+//!          scope1.foo.tenant1 = 10  (BLOCKED, on rule scope1/*/tenant1)
+//!
+//!
+//! This illustrates the following:
+//!   1. An invocation/vqueue can be blocked on multiple levels at the same time.
+//!   2. Parent counters are inclusive of their children counters but can be bigger because
+//!      some invocations are invoked directly on their level (e.g. scope1/bar)
+//!   3. Multiple invocations/vqueues can be blocked on the same rule but different concrete
+//!      counters. For instance, inv5 and inv4 at L3-level rule scope1/*/tenant1 but if an
+//!      permit was released (e.g. scope1/foo/tenant1), that would only impact inv5's potential
+//!      eligibility but not inv4's.
+//!   4. A counter at a specific level matches a single rule, or no rule (unlimited). It cannot
+//!      match multiple rules following the rules of precedence defined in `restate-limiter`'s
+//!      rule module. This means that if a rule has been "deleted", or "inserted", some counters
+//!      may match different rules than before and therefore different limits. This also may impact
+//!      the eligibility of vqueues that belong to these counters.
+//!   5. Because a rule may match many counters, one cannot simply say that a vqueue is blocked
+//!      behind a rule. Instead, the combination of the rule _and_ the concrete counter(s) are
+//!      what determines whether a vqueue is eligible or not. A change in any of them would result
+//!      in a _potential_ impact on the eligibility.
+//!
+//! ## Design
+//!
+//! ### Transactional acquisition
+//!
+//! The check phase in `poll_acquire_permit` is side-effect free — it only stages resources in
+//! a [`ProvisionalPermit`]. All state mutations (lock acquisition, counter increments) happen
+//! atomically in [`ProvisionalPermit::secure`]. If any check fails, the provisional is dropped
+//! without side effects, and the vqueue is registered behind the first blocking resource.
+//!
+//! ### Waiter tracking
+//!
+//! Each blocked vqueue is queued behind a single counter — the narrowest (deepest) level where
+//! it's blocked. Waiter lists are embedded directly in the trie nodes ([`ScopeNode`],
+//! [`L1Node`], [`L2Leaf`]) alongside usage counters.
+//!
+//! The routing info (scope, limit_key, blocked_level) is carried in
+//! `ResourceKind::LimitKeyConcurrency` and held by the `EligibilityTracker`. The `UserLimiter`
+//! does not maintain its own membership map — removal uses the routing info passed back from
+//! the eligibility tracker.
+//!
+//! ### Correctness of narrowest-counter queuing
+//!
+//! A permit release always decrements ALL ancestor counters. If the narrowest blocked counter
+//! decreases, all its ancestors also decrease. The vqueue is woken, re-evaluates, and either
+//! proceeds or re-queues at a different narrowest-blocked counter (dynamic migration).
+//!
+//! ### Wake strategy
+//!
+//! On release, we pop at most 1 vqueue from each affected counter's waiter list (up to 3
+//! wakeups per release — one per level). Waking proceeds deepest level first so that vqueues
+//! blocked on the most restrictive counter get priority, since the release directly addresses
+//! their constraint.
+//!
+//! ### Rule updates
+//!
+//! When a rule changes, we only wake waiters at the changed rule's level — not descendants.
+//! Waiters at deeper levels are blocked on something more specific; the shallower change doesn't
+//! help them. When eventually re-evaluated, they see the current rules. Over-limit scenarios
+//! (rule becomes more restrictive while permits are outstanding) use soft enforcement: existing
+//! permits drain naturally, new ones are denied until usage drops below the new limit.
+//!
+//! ### Trie pruning
+//!
+//! After each release, empty trie nodes are pruned bottom-up: L2 leaves, then L1 nodes, then
+//! scope nodes are removed when they have zero usage, no waiters, and no children. This prevents
+//! unbounded trie growth from transient keys.
+//!
+//! Note: usage and waiter counts are related but not strictly coupled. For example, usage can
+//! transiently be zero while waiters still exist if many releases happen before woken vqueues
+//! are re-evaluated.
+
+use std::collections::VecDeque;
+use std::fmt;
+use std::num::NonZeroU64;
+
+use arrayvec::ArrayVec;
+use hashbrown::HashMap;
+
+use restate_limiter::{
+    Level, Limit, LimitKey, Pattern, RuleHandle, RulePattern, Rules, StructuredLimits,
+};
+use restate_types::Scope;
+use restate_util_string::{ReString, RestrictedValue};
+
+use crate::scheduler::VQueueHandle;
+
+#[derive(Clone, Copy, Debug)]
+pub enum LimitKind {
+    Concurrency,
+}
+
+#[derive(Default, Copy, Clone, Debug)]
+pub struct Usage {
+    /// Usage value for [`LimitKind::Concurrency`]
+    concurrency: u32,
+}
+
+impl Usage {
+    fn increment(&mut self, limit_kind: LimitKind) {
+        match limit_kind {
+            LimitKind::Concurrency => self.concurrency += 1,
+        }
+    }
+
+    fn decrement(&mut self, limit_kind: LimitKind) {
+        match limit_kind {
+            LimitKind::Concurrency => self.concurrency = self.concurrency.saturating_sub(1),
+        }
+    }
+
+    fn is_zero(&self) -> bool {
+        self.concurrency == 0
+    }
+}
+
+// This lives here temporarily until it finds a proper home
+#[derive(Debug, Default, Clone)]
+pub struct UserLimits {
+    // None means unlimited
+    action_concurrency: Option<NonZeroU64>,
+}
+
+impl UserLimits {
+    #[cfg(test)]
+    pub fn new(action_concurrency: Option<NonZeroU64>) -> Self {
+        Self { action_concurrency }
+    }
+}
+
+pub struct UserLimiter {
+    state: State,
+    rules: Rules<ReString, UserLimits>,
+}
+
+impl UserLimiter {
+    pub fn create() -> Self {
+        Self {
+            rules: Rules::default(),
+            state: Default::default(),
+        }
+    }
+
+    /// Checks capacity for the given scope + limit key across all hierarchy levels.
+    ///
+    /// Returns a [`CapacityResult`] that the caller can inspect, log, or store.
+    /// Use [`CapacityResult::has_capacity`] or [`CapacityResult::narrowest_blocked`] to
+    /// determine the outcome.
+    pub(super) fn check_concurrency_capacity(
+        &self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+    ) -> CapacityResult {
+        let limits = self.rules.lookup(scope.as_str(), limit_key);
+        self.state
+            .check_capacity(scope, limit_key, LimitKind::Concurrency, &limits)
+    }
+
+    /// Increments usage counters at all levels along the path (scope → l1 → l2).
+    pub(super) fn increment_all(
+        &mut self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        limit_kind: LimitKind,
+    ) {
+        self.state.increment_all(scope, limit_key, limit_kind);
+    }
+
+    /// Decrements usage counters and wakes up to 1 vqueue per affected counter level.
+    ///
+    /// Returns up to 3 vqueue handles that should be woken via `EligibilityTracker`.
+    pub(super) fn release_action_concurrency(
+        &mut self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+    ) -> ArrayVec<VQueueHandle, { Level::COUNT }> {
+        self.state
+            .decrement_and_wake(scope, limit_key, LimitKind::Concurrency)
+    }
+
+    /// Adds a vqueue to the waiter list at the specified trie node.
+    pub(super) fn add_to_waiters(
+        &mut self,
+        handle: VQueueHandle,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        blocked_level: Level,
+    ) {
+        self.state
+            .add_to_waiters(handle, scope, limit_key, blocked_level);
+    }
+
+    /// Removes a vqueue from the waiter list using caller-provided routing info.
+    pub(super) fn remove_from_waiters(
+        &mut self,
+        handle: VQueueHandle,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        blocked_level: Level,
+    ) {
+        self.state
+            .remove_from_waiters(handle, scope, limit_key, blocked_level);
+    }
+
+    /// Applies a rule update (add, remove, or update) and returns vqueues that need re-evaluation.
+    ///
+    /// This uses soft enforcement: existing permits that exceed new lower limits are not revoked;
+    /// the system simply stops issuing new permits until usage drains below the new limit.
+    pub(super) fn apply_rule_update(&mut self, update: RuleUpdate) -> Vec<VQueueHandle> {
+        let pattern = match &update {
+            RuleUpdate::Upsert { pattern, .. } => pattern.clone(),
+            RuleUpdate::Remove { pattern } => pattern.clone(),
+        };
+
+        // Apply the mutation to the rules store
+        match update {
+            RuleUpdate::Upsert { pattern, limit } => {
+                self.rules.upsert_rule(pattern, limit);
+            }
+            RuleUpdate::Remove { pattern } => {
+                self.rules.remove_rule(&pattern);
+            }
+        }
+
+        // Walk the trie guided by the pattern and drain affected waiter lists
+        self.state.drain_affected_waiters(&pattern)
+    }
+
+    /// Resolves a rule handle to its pattern. Returns `None` if the handle is stale
+    /// (rule was removed since the handle was captured).
+    #[allow(dead_code)]
+    pub fn resolve_rule(&self, handle: RuleHandle) -> Option<&RulePattern<ReString>> {
+        self.rules.get_pattern(handle)
+    }
+}
+
+/// Describes a rule mutation.
+#[allow(dead_code)]
+pub enum RuleUpdate {
+    /// Insert a new rule or update an existing one with the same pattern.
+    Upsert {
+        pattern: RulePattern<ReString>,
+        limit: UserLimits,
+    },
+    /// Remove a rule by its pattern.
+    Remove { pattern: RulePattern<ReString> },
+}
+
+#[derive(Debug, Default)]
+struct State {
+    scopes: HashMap<Scope, ScopeNode>,
+}
+
+/// Scope-level trie node with usage counter, waiter list, and L1 children.
+#[derive(Debug, Default)]
+struct ScopeNode {
+    value: Usage,
+    waiters: VecDeque<VQueueHandle>,
+    l1: HashMap<RestrictedValue<ReString>, L1Node>,
+}
+
+/// L1-level trie node with usage counter, waiter list, and L2 children.
+#[derive(Debug, Default)]
+struct L1Node {
+    value: Usage,
+    waiters: VecDeque<VQueueHandle>,
+    l2: HashMap<RestrictedValue<ReString>, L2Leaf>,
+}
+
+impl ScopeNode {
+    /// Returns true if this node has no usage, no waiters, and no children.
+    fn is_unused(&self) -> bool {
+        self.value.is_zero() && self.waiters.is_empty() && self.l1.is_empty()
+    }
+}
+
+impl L1Node {
+    /// Returns true if this node has no usage, no waiters, and no children.
+    fn is_unused(&self) -> bool {
+        self.value.is_zero() && self.waiters.is_empty() && self.l2.is_empty()
+    }
+}
+
+/// L2-level trie leaf with usage counter and waiter list.
+#[derive(Debug, Default)]
+struct L2Leaf {
+    value: Usage,
+    waiters: VecDeque<VQueueHandle>,
+}
+
+impl L2Leaf {
+    fn is_unused(&self) -> bool {
+        self.value.is_zero() && self.waiters.is_empty()
+    }
+}
+
+impl State {
+    fn increment_all(
+        &mut self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        limit_kind: LimitKind,
+    ) {
+        let scope_node = self.scopes.entry_ref(scope).or_default();
+        scope_node.value.increment(limit_kind);
+        match limit_key {
+            LimitKey::None => {}
+            LimitKey::L1(l1) => {
+                scope_node
+                    .l1
+                    .entry_ref(l1)
+                    .or_default()
+                    .value
+                    .increment(limit_kind);
+            }
+            LimitKey::L2(l1, l2) => {
+                let l1_node = scope_node.l1.entry_ref(l1).or_default();
+                l1_node.value.increment(limit_kind);
+                l1_node
+                    .l2
+                    .entry_ref(l2)
+                    .or_default()
+                    .value
+                    .increment(limit_kind);
+            }
+        }
+    }
+
+    /// Decrements counters along the path and pops at most 1 waiter per affected level.
+    ///
+    /// Wakes deepest level first so that vqueues blocked on the most restrictive (narrowest)
+    /// counter get priority — they are most likely to succeed since the release directly
+    /// addresses their constraint.
+    ///
+    /// After waking, prunes empty trie nodes bottom-up to avoid unbounded growth.
+    fn decrement_and_wake(
+        &mut self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        limit_kind: LimitKind,
+    ) -> ArrayVec<VQueueHandle, { Level::COUNT }> {
+        let mut woken = ArrayVec::new();
+
+        let Some(scope_node) = self.scopes.get_mut(scope) else {
+            return woken;
+        };
+
+        // Decrement all affected counters top-down (natural traversal order)
+        scope_node.value.decrement(limit_kind);
+        match limit_key {
+            LimitKey::None => {}
+            LimitKey::L1(l1) => {
+                if let Some(l1_node) = scope_node.l1.get_mut(l1) {
+                    l1_node.value.decrement(limit_kind);
+                }
+            }
+            LimitKey::L2(l1, l2) => {
+                if let Some(l1_node) = scope_node.l1.get_mut(l1) {
+                    l1_node.value.decrement(limit_kind);
+                    if let Some(l2_leaf) = l1_node.l2.get_mut(l2) {
+                        l2_leaf.value.decrement(limit_kind);
+                    } else {
+                        debug_assert!(
+                            false,
+                            "missing Level2 node for released key: scope='{}', l1='{}', l2='{}'",
+                            scope, l1, l2,
+                        );
+                    }
+                } else {
+                    debug_assert!(
+                        false,
+                        "missing Level1 node for released key: scope='{}', l1='{}'",
+                        scope, l1,
+                    );
+                }
+            }
+        }
+
+        // Wake deepest level first — vqueues blocked on narrower counters have
+        // more restrictive limits and are most likely to benefit from this release.
+        match limit_key {
+            LimitKey::None => {}
+            LimitKey::L2(l1, l2) => {
+                if let Some(l1_node) = scope_node.l1.get_mut(l1) {
+                    if let Some(l2_leaf) = l1_node.l2.get_mut(l2)
+                        && let Some(h) = l2_leaf.waiters.pop_front()
+                    {
+                        woken.push(h);
+                    }
+                    if let Some(h) = l1_node.waiters.pop_front() {
+                        woken.push(h);
+                    }
+                }
+            }
+            LimitKey::L1(l1) => {
+                if let Some(l1_node) = scope_node.l1.get_mut(l1)
+                    && let Some(h) = l1_node.waiters.pop_front()
+                {
+                    woken.push(h);
+                }
+            }
+        }
+        if let Some(h) = scope_node.waiters.pop_front() {
+            woken.push(h);
+        }
+
+        // Prune empty nodes bottom-up
+        match limit_key {
+            LimitKey::None => {}
+            LimitKey::L1(l1) => {
+                if scope_node.l1.get(l1).is_some_and(|n| n.is_unused()) {
+                    scope_node.l1.remove(l1);
+                }
+            }
+            LimitKey::L2(l1, l2) => {
+                if let Some(l1_node) = scope_node.l1.get_mut(l1)
+                    && l1_node.l2.get(l2).is_some_and(|n| n.is_unused())
+                {
+                    l1_node.l2.remove(l2);
+                }
+                if scope_node.l1.get(l1).is_some_and(|n| n.is_unused()) {
+                    scope_node.l1.remove(l1);
+                }
+            }
+        }
+        if scope_node.is_unused() {
+            self.scopes.remove(scope);
+        }
+
+        woken
+    }
+
+    fn add_to_waiters(
+        &mut self,
+        handle: VQueueHandle,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        blocked_level: Level,
+    ) {
+        let scope_node = self.scopes.entry_ref(scope).or_default();
+        match blocked_level {
+            Level::Scope => {
+                scope_node.waiters.push_back(handle);
+            }
+            Level::Level1 => {
+                let l1_key = limit_key
+                    .level1()
+                    .expect("L1 key required for Level1 block");
+                scope_node
+                    .l1
+                    .entry_ref(l1_key)
+                    .or_default()
+                    .waiters
+                    .push_back(handle);
+            }
+            Level::Level2 => {
+                let l1_key = limit_key
+                    .level1()
+                    .expect("L1 key required for Level2 block");
+                let l2_key = limit_key
+                    .level2()
+                    .expect("L2 key required for Level2 block");
+                scope_node
+                    .l1
+                    .entry_ref(l1_key)
+                    .or_default()
+                    .l2
+                    .entry_ref(l2_key)
+                    .or_default()
+                    .waiters
+                    .push_back(handle);
+            }
+        }
+    }
+
+    fn remove_from_waiters(
+        &mut self,
+        handle: VQueueHandle,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        blocked_level: Level,
+    ) {
+        let Some(scope_node) = self.scopes.get_mut(scope) else {
+            return;
+        };
+        match blocked_level {
+            Level::Scope => {
+                scope_node.waiters.retain(|h| *h != handle);
+            }
+            Level::Level1 => {
+                if let Some(l1_key) = limit_key.level1()
+                    && let Some(l1_node) = scope_node.l1.get_mut(l1_key)
+                {
+                    l1_node.waiters.retain(|h| *h != handle);
+                }
+            }
+            Level::Level2 => {
+                if let Some(l1_key) = limit_key.level1()
+                    && let Some(l1_node) = scope_node.l1.get_mut(l1_key)
+                    && let Some(l2_key) = limit_key.level2()
+                    && let Some(l2_leaf) = l1_node.l2.get_mut(l2_key)
+                {
+                    l2_leaf.waiters.retain(|h| *h != handle);
+                }
+            }
+        }
+    }
+
+    /// Walks the trie guided by a rule pattern and drains waiter lists from all matching
+    /// nodes at the pattern's target level.
+    ///
+    /// Uses `Pattern::Exact` for O(1) lookups and `Pattern::Wildcard` for iterating all
+    /// entries at that level. Only drains waiters at the rule's own level, not descendants.
+    fn drain_affected_waiters(&mut self, pattern: &RulePattern<ReString>) -> Vec<VQueueHandle> {
+        let mut woken = Vec::new();
+        match pattern {
+            RulePattern::Scope(scope_pat) => {
+                for_each_matching_scope(&mut self.scopes, scope_pat, |scope_node| {
+                    woken.extend(scope_node.waiters.drain(..));
+                });
+            }
+            RulePattern::L1 {
+                scope: scope_pat,
+                l1: l1_pat,
+            } => {
+                for_each_matching_scope(&mut self.scopes, scope_pat, |scope_node| {
+                    for_each_matching(&mut scope_node.l1, l1_pat, |l1_node| {
+                        woken.extend(l1_node.waiters.drain(..));
+                    });
+                });
+            }
+            RulePattern::L2 {
+                scope: scope_pat,
+                l1: l1_pat,
+                l2: l2_pat,
+            } => {
+                for_each_matching_scope(&mut self.scopes, scope_pat, |scope_node| {
+                    for_each_matching(&mut scope_node.l1, l1_pat, |l1_node| {
+                        for_each_matching(&mut l1_node.l2, l2_pat, |l2_leaf| {
+                            woken.extend(l2_leaf.waiters.drain(..));
+                        });
+                    });
+                });
+            }
+        }
+        woken
+    }
+
+    fn check_capacity(
+        &self,
+        scope: &Scope,
+        limit_key: &LimitKey<ReString>,
+        limit_kind: LimitKind,
+        limits: &StructuredLimits<&UserLimits>,
+    ) -> CapacityResult {
+        match limit_key {
+            LimitKey::None => self.check_scope(limit_kind, scope, limits),
+            LimitKey::L1(l1) => self.check_l1(limit_kind, scope, l1, limits),
+            LimitKey::L2(l1, l2) => self.check_l1_l2(limit_kind, scope, l1, l2, limits),
+        }
+    }
+
+    fn check_scope(
+        &self,
+        limit_kind: LimitKind,
+        scope: &Scope,
+        limits: &StructuredLimits<&UserLimits>,
+    ) -> CapacityResult {
+        let current = self.scopes.get(scope).map(|n| &n.value);
+        let mut levels = ArrayVec::new();
+        levels.push(make_level_status(
+            Level::Scope,
+            current,
+            limits.limit_at(Level::Scope),
+            limit_kind,
+        ));
+        CapacityResult { levels }
+    }
+
+    fn check_l1(
+        &self,
+        limit_kind: LimitKind,
+        scope: &Scope,
+        l1: &RestrictedValue<ReString>,
+        limits: &StructuredLimits<&UserLimits>,
+    ) -> CapacityResult {
+        let (scope_current, l1_current) = match self.scopes.get(scope) {
+            Some(sn) => (Some(&sn.value), sn.l1.get(l1).map(|n| &n.value)),
+            None => (None, None),
+        };
+
+        let mut levels = ArrayVec::new();
+        levels.push(make_level_status(
+            Level::Scope,
+            scope_current,
+            limits.limit_at(Level::Scope),
+            limit_kind,
+        ));
+        levels.push(make_level_status(
+            Level::Level1,
+            l1_current,
+            limits.limit_at(Level::Level1),
+            limit_kind,
+        ));
+        CapacityResult { levels }
+    }
+
+    fn check_l1_l2(
+        &self,
+        limit_kind: LimitKind,
+        scope: &Scope,
+        l1: &RestrictedValue<ReString>,
+        l2: &RestrictedValue<ReString>,
+        limits: &StructuredLimits<&UserLimits>,
+    ) -> CapacityResult {
+        let (scope_current, l1_current, l2_current) = match self.scopes.get(scope) {
+            Some(sn) => {
+                let l1n = sn.l1.get(l1);
+                (
+                    Some(&sn.value),
+                    l1n.map(|n| &n.value),
+                    l1n.and_then(|n| n.l2.get(l2)).map(|leaf| &leaf.value),
+                )
+            }
+            None => (None, None, None),
+        };
+
+        let mut levels = ArrayVec::new();
+        levels.push(make_level_status(
+            Level::Scope,
+            scope_current,
+            limits.limit_at(Level::Scope),
+            limit_kind,
+        ));
+        levels.push(make_level_status(
+            Level::Level1,
+            l1_current,
+            limits.limit_at(Level::Level1),
+            limit_kind,
+        ));
+        levels.push(make_level_status(
+            Level::Level2,
+            l2_current,
+            limits.limit_at(Level::Level2),
+            limit_kind,
+        ));
+        CapacityResult { levels }
+    }
+}
+
+/// Applies `f` to each scope node matching the scope pattern.
+fn for_each_matching_scope(
+    scopes: &mut HashMap<Scope, ScopeNode>,
+    pat: &Pattern<ReString>,
+    mut f: impl FnMut(&mut ScopeNode),
+) {
+    match pat {
+        Pattern::Exact(val) => {
+            if let Some(node) = scopes.get_mut(val.as_str()) {
+                f(node);
+            }
+        }
+        Pattern::Wildcard => {
+            for node in scopes.values_mut() {
+                f(node);
+            }
+        }
+    }
+}
+
+/// Applies `f` to each entry in a `HashMap<RestrictedValue<ReString>, V>` matching the pattern.
+fn for_each_matching<V>(
+    map: &mut HashMap<RestrictedValue<ReString>, V>,
+    pat: &Pattern<ReString>,
+    mut f: impl FnMut(&mut V),
+) {
+    match pat {
+        Pattern::Exact(val) => {
+            if let Some(node) = map.get_mut(val) {
+                f(node);
+            }
+        }
+        Pattern::Wildcard => {
+            for node in map.values_mut() {
+                f(node);
+            }
+        }
+    }
+}
+
+/// Result of a capacity check across all applicable hierarchy levels.
+#[derive(Clone, Debug)]
+pub struct CapacityResult {
+    /// Status for each applicable level (stack-allocated, up to 3).
+    levels: ArrayVec<LevelStatus, { Level::COUNT }>,
+}
+
+#[allow(dead_code)]
+impl CapacityResult {
+    /// Returns `true` if all levels have capacity available.
+    pub fn has_capacity(&self) -> bool {
+        self.levels.iter().all(|l| l.has_capacity())
+    }
+
+    /// Returns the narrowest (deepest) blocked level and its rule handle.
+    /// Returns `None` if all levels have capacity.
+    pub fn narrowest_blocked(&self) -> Option<(Level, Option<RuleHandle>)> {
+        self.levels
+            .iter()
+            .rev()
+            .find(|l| !l.has_capacity())
+            .map(|l| (l.level, l.rule_handle))
+    }
+
+    /// Iterates over per-level status entries.
+    pub fn iter(&self) -> impl Iterator<Item = &LevelStatus> {
+        self.levels.iter()
+    }
+}
+
+impl CapacityResult {
+    /// Creates a display wrapper that resolves rule handles to their patterns
+    /// via the provided [`UserLimiter`].
+    pub fn display<'a>(&'a self, limiter: &'a UserLimiter) -> CapacityResultDisplay<'a> {
+        CapacityResultDisplay {
+            result: self,
+            limiter,
+        }
+    }
+}
+
+/// Display wrapper for [`CapacityResult`] that resolves rule handles to patterns.
+///
+/// Created via [`CapacityResult::display`].
+pub struct CapacityResultDisplay<'a> {
+    result: &'a CapacityResult,
+    limiter: &'a UserLimiter,
+}
+
+impl fmt::Display for CapacityResultDisplay<'_> {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        let mut first = true;
+        for status in &self.result.levels {
+            if !first {
+                write!(f, ", ")?;
+            }
+            first = false;
+
+            write!(f, "{}={}/", status.level, status.usage)?;
+            match status.limit_value {
+                None => write!(f, "unlimited")?,
+                Some(limit) => {
+                    write!(f, "{}", limit)?;
+                    // Resolve the rule pattern for context
+                    if let Some(handle) = status.rule_handle {
+                        match self.limiter.resolve_rule(handle) {
+                            Some(pattern) => write!(f, " [{}]", pattern)?,
+                            None => write!(f, " [rule removed]")?,
+                        }
+                    }
+                    let tag = if status.has_capacity() {
+                        "ok"
+                    } else {
+                        "BLOCKED"
+                    };
+                    write!(f, " ({})", tag)?;
+                }
+            }
+        }
+        Ok(())
+    }
+}
+
+/// Status of a single level's capacity.
+#[derive(Clone, Debug)]
+pub struct LevelStatus {
+    /// The hierarchy level (Scope, Level1, or Level2).
+    pub level: Level,
+    /// Current usage at this level.
+    pub usage: u32,
+    /// The configured limit, or `None` if unlimited.
+    pub limit_value: Option<NonZeroU64>,
+    /// Handle to the rule defining the limit. `None` if unlimited.
+    /// Resolve via [`UserLimiter::resolve_rule`] for display.
+    pub rule_handle: Option<RuleHandle>,
+}
+
+#[allow(dead_code)]
+impl LevelStatus {
+    /// Returns `true` if this level has capacity available.
+    pub fn has_capacity(&self) -> bool {
+        self.limit_value
+            .map(|limit| (self.usage as u64) < limit.get())
+            .unwrap_or(true)
+    }
+
+    /// Returns the available capacity, or `None` if unlimited.
+    pub fn available(&self) -> Option<u64> {
+        self.limit_value
+            .map(|limit| limit.get().saturating_sub(self.usage as u64))
+    }
+}
+
+/// Constructs a [`LevelStatus`] from the trie usage and the resolved limit.
+fn make_level_status(
+    level: Level,
+    current: Option<&Usage>,
+    limit: &Limit<&UserLimits>,
+    limit_kind: LimitKind,
+) -> LevelStatus {
+    let usage = current.map_or(0, |u| match limit_kind {
+        LimitKind::Concurrency => u.concurrency,
+    });
+    let (limit_value, rule_handle) = match limit {
+        Limit::Undefined => (None, None),
+        Limit::Defined(handle, user_limits) => {
+            let value = match limit_kind {
+                LimitKind::Concurrency => user_limits.action_concurrency,
+            };
+            (value, Some(*handle))
+        }
+    };
+    LevelStatus {
+        level,
+        usage,
+        limit_value,
+        rule_handle,
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use std::num::NonZeroU64;
+
+    use restate_limiter::{LimitKey, RulePattern};
+    use restate_util_string::ReString;
+
+    use super::*;
+
+    fn scope(s: &str) -> Scope {
+        Scope::new(s)
+    }
+
+    fn limit_key(s: &str) -> LimitKey<ReString> {
+        s.parse().unwrap()
+    }
+
+    fn rule(s: &str) -> RulePattern<ReString> {
+        s.parse().unwrap()
+    }
+
+    fn limits(concurrency: u64) -> UserLimits {
+        UserLimits::new(NonZeroU64::new(concurrency))
+    }
+
+    /// Creates a UserLimiter with the given rules.
+    fn limiter_with_rules(specs: &[(&str, u64)]) -> UserLimiter {
+        let rules = Rules::from_rules(specs.iter().map(|(pat, limit)| {
+            (
+                pat.parse::<RulePattern<ReString>>().unwrap(),
+                limits(*limit),
+            )
+        }));
+        UserLimiter {
+            rules,
+            state: Default::default(),
+        }
+    }
+
+    // Fake VQueueHandle for testing. The slotmap key needs to be created via a SlotMap.
+    fn make_handles(n: usize) -> (slotmap::SlotMap<VQueueHandle, ()>, Vec<VQueueHandle>) {
+        let mut sm = slotmap::SlotMap::with_key();
+        let handles: Vec<_> = (0..n).map(|_| sm.insert(())).collect();
+        (sm, handles)
+    }
+
+    #[test]
+    fn check_capacity_unlimited() {
+        let limiter = limiter_with_rules(&[]);
+        let result = limiter.check_concurrency_capacity(&scope("s1"), &LimitKey::None);
+        assert!(result.has_capacity());
+    }
+
+    #[test]
+    fn check_capacity_with_headroom() {
+        let mut limiter = limiter_with_rules(&[("*", 10)]);
+        for _ in 0..5 {
+            limiter.increment_all(&scope("s1"), &LimitKey::None, LimitKind::Concurrency);
+        }
+        let result = limiter.check_concurrency_capacity(&scope("s1"), &LimitKey::None);
+        assert!(result.has_capacity());
+    }
+
+    #[test]
+    fn check_capacity_blocked_at_scope() {
+        let mut limiter = limiter_with_rules(&[("*", 2)]);
+        let s = scope("s1");
+        limiter.increment_all(&s, &LimitKey::None, LimitKind::Concurrency);
+        limiter.increment_all(&s, &LimitKey::None, LimitKind::Concurrency);
+
+        let result = limiter.check_concurrency_capacity(&s, &LimitKey::None);
+        let (level, rule_handle) = result.narrowest_blocked().unwrap();
+        assert_eq!(level, Level::Scope);
+        let rule = limiter.resolve_rule(rule_handle.unwrap()).unwrap();
+        assert_eq!(rule.to_string(), "*");
+    }
+
+    #[test]
+    fn check_capacity_blocked_at_l2_narrowest() {
+        // scope limit = 100, L2 limit = 2
+        let mut limiter = limiter_with_rules(&[("*", 100), ("s1/*/t1", 2)]);
+        let s = scope("s1");
+        let lk = limit_key("foo/t1");
+
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+
+        // s1=2 (under 100), s1.foo=2 (unlimited), s1.foo.t1=2 (at limit)
+        let result = limiter.check_concurrency_capacity(&s, &lk);
+        let (level, rule_handle) = result.narrowest_blocked().unwrap();
+        assert_eq!(level, Level::Level2);
+        let rule = limiter.resolve_rule(rule_handle.unwrap()).unwrap();
+        assert_eq!(rule.to_string(), "s1/*/t1");
+    }
+
+    #[test]
+    fn check_capacity_blocked_on_both_scope_and_l2_returns_narrowest() {
+        let mut limiter = limiter_with_rules(&[("*", 2), ("s1/*/t1", 2)]);
+        let s = scope("s1");
+        let lk = limit_key("foo/t1");
+
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+
+        // Both scope and L2 are at limit; narrowest is L2
+        let result = limiter.check_concurrency_capacity(&s, &lk);
+        let (level, _) = result.narrowest_blocked().unwrap();
+        assert_eq!(level, Level::Level2);
+    }
+
+    #[test]
+    fn increment_and_decrement_all_levels() {
+        let mut limiter = limiter_with_rules(&[]);
+        let s = scope("s1");
+        let lk = limit_key("foo/bar");
+
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+
+        assert_eq!(limiter.state.scopes[&s].value.concurrency, 2);
+        let l1 = lk.level1().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1].value.concurrency, 2);
+        let l2 = lk.level2().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1].l2[l2].value.concurrency, 2);
+
+        // Decrement via release (also pops waiters, but there are none)
+        let woken = limiter.release_action_concurrency(&s, &lk);
+        assert!(woken.is_empty());
+        assert_eq!(limiter.state.scopes[&s].value.concurrency, 1);
+        assert_eq!(limiter.state.scopes[&s].l1[l1].value.concurrency, 1);
+        assert_eq!(limiter.state.scopes[&s].l1[l1].l2[l2].value.concurrency, 1);
+    }
+
+    #[test]
+    fn release_prunes_empty_trie_nodes() {
+        let mut limiter = limiter_with_rules(&[]);
+        let s = scope("s1");
+        let lk = limit_key("foo/bar");
+
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        assert!(limiter.state.scopes.contains_key(&s));
+
+        // Release the single permit — all counters go to zero, nodes should be pruned
+        limiter.release_action_concurrency(&s, &lk);
+        assert!(
+            !limiter.state.scopes.contains_key(&s),
+            "scope node should be pruned when fully empty"
+        );
+
+        // Partial pruning: scope still has usage from a different path
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        limiter.increment_all(&s, &LimitKey::None, LimitKind::Concurrency);
+
+        // Release the L2 path — L2 and L1 should be pruned, but scope stays (has usage=1)
+        limiter.release_action_concurrency(&s, &lk);
+        assert!(limiter.state.scopes.contains_key(&s));
+        let l1 = lk.level1().unwrap();
+        assert!(
+            !limiter.state.scopes[&s].l1.contains_key(l1),
+            "l1 node should be pruned when its subtree is empty"
+        );
+    }
+
+    #[test]
+    fn add_and_remove_waiters() {
+        let mut limiter = limiter_with_rules(&[]);
+        let (_sm, handles) = make_handles(3);
+        let s = scope("s1");
+        let lk = limit_key("foo/bar");
+
+        // Add waiters at different levels
+        limiter.add_to_waiters(handles[0], &s, &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[1], &s, &lk, Level::Level1);
+        limiter.add_to_waiters(handles[2], &s, &lk, Level::Level2);
+
+        // Verify they're there
+        assert_eq!(limiter.state.scopes[&s].waiters.len(), 1);
+        let l1 = lk.level1().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1].waiters.len(), 1);
+        let l2 = lk.level2().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1].l2[l2].waiters.len(), 1);
+
+        // Remove the L1 waiter
+        limiter.remove_from_waiters(handles[1], &s, &lk, Level::Level1);
+        assert_eq!(limiter.state.scopes[&s].l1[l1].waiters.len(), 0);
+        // Others untouched
+        assert_eq!(limiter.state.scopes[&s].waiters.len(), 1);
+        assert_eq!(limiter.state.scopes[&s].l1[l1].l2[l2].waiters.len(), 1);
+    }
+
+    #[test]
+    fn release_wakes_one_per_level() {
+        let mut limiter = limiter_with_rules(&[("*", 2)]);
+        let (_sm, handles) = make_handles(6);
+        let s = scope("s1");
+        let lk = limit_key("foo/bar");
+
+        // Fill up counters
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+        limiter.increment_all(&s, &lk, LimitKind::Concurrency);
+
+        // Park 2 waiters at each level
+        limiter.add_to_waiters(handles[0], &s, &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[1], &s, &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[2], &s, &lk, Level::Level1);
+        limiter.add_to_waiters(handles[3], &s, &lk, Level::Level1);
+        limiter.add_to_waiters(handles[4], &s, &lk, Level::Level2);
+        limiter.add_to_waiters(handles[5], &s, &lk, Level::Level2);
+
+        // Release 1 permit for the full L2 path
+        let woken = limiter.release_action_concurrency(&s, &lk);
+        // Should wake exactly 1 from each level, deepest first
+        assert_eq!(woken.len(), 3);
+        assert_eq!(woken[0], handles[4]); // l2 head (deepest, highest priority)
+        assert_eq!(woken[1], handles[2]); // l1 head
+        assert_eq!(woken[2], handles[0]); // scope head (shallowest, lowest priority)
+
+        // Each level still has 1 remaining waiter
+        assert_eq!(limiter.state.scopes[&s].waiters.len(), 1);
+        let l1k = lk.level1().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1k].waiters.len(), 1);
+        let l2k = lk.level2().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1k].l2[l2k].waiters.len(), 1);
+    }
+
+    #[test]
+    fn rule_update_upsert_drains_affected_waiters() {
+        let mut limiter = limiter_with_rules(&[("*", 100)]);
+        let (_sm, handles) = make_handles(3);
+        let s = scope("s1");
+
+        // Park waiters at scope level
+        limiter.add_to_waiters(handles[0], &s, &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[1], &s, &LimitKey::None, Level::Scope);
+
+        // Also park one at L1 level under a different counter
+        let lk = limit_key("foo");
+        limiter.add_to_waiters(handles[2], &s, &lk, Level::Level1);
+
+        // Upsert a scope-level rule: should drain scope waiters only
+        let woken = limiter.apply_rule_update(RuleUpdate::Upsert {
+            pattern: rule("s1"),
+            limit: limits(200),
+        });
+        assert_eq!(woken.len(), 2);
+        assert!(woken.contains(&handles[0]));
+        assert!(woken.contains(&handles[1]));
+
+        // L1 waiter was NOT drained (scope-level rule doesn't affect L1 waiters)
+        let l1k = lk.level1().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1k].waiters.len(), 1);
+    }
+
+    #[test]
+    fn rule_update_remove_drains_affected_waiters() {
+        let mut limiter = limiter_with_rules(&[("*", 100), ("s1/*/t1", 10)]);
+        let (_sm, handles) = make_handles(4);
+        let s = scope("s1");
+
+        // Park waiters at L2 nodes matching the pattern s1/*/t1
+        let lk1 = limit_key("foo/t1");
+        let lk2 = limit_key("bar/t1");
+        limiter.add_to_waiters(handles[0], &s, &lk1, Level::Level2);
+        limiter.add_to_waiters(handles[1], &s, &lk2, Level::Level2);
+
+        // Park a waiter at L2 for a different l2 key (should NOT be drained)
+        let lk3 = limit_key("foo/t2");
+        limiter.add_to_waiters(handles[2], &s, &lk3, Level::Level2);
+
+        // Park a waiter at scope (should NOT be drained)
+        limiter.add_to_waiters(handles[3], &s, &LimitKey::None, Level::Scope);
+
+        // Remove the L2 rule: should drain L2 waiters matching s1/*/t1
+        let woken = limiter.apply_rule_update(RuleUpdate::Remove {
+            pattern: rule("s1/*/t1"),
+        });
+        assert_eq!(woken.len(), 2);
+        assert!(woken.contains(&handles[0]));
+        assert!(woken.contains(&handles[1]));
+
+        // t2 waiter still there
+        let l1k = lk3.level1().unwrap();
+        let l2k = lk3.level2().unwrap();
+        assert_eq!(limiter.state.scopes[&s].l1[l1k].l2[l2k].waiters.len(), 1);
+
+        // scope waiter still there
+        assert_eq!(limiter.state.scopes[&s].waiters.len(), 1);
+    }
+
+    #[test]
+    fn rule_update_wildcard_scope_drains_all_scopes() {
+        let mut limiter = limiter_with_rules(&[("*", 100)]);
+        let (_sm, handles) = make_handles(3);
+
+        // Park waiters at different scope nodes
+        limiter.add_to_waiters(handles[0], &scope("s1"), &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[1], &scope("s2"), &LimitKey::None, Level::Scope);
+        limiter.add_to_waiters(handles[2], &scope("s3"), &LimitKey::None, Level::Scope);
+
+        // Update wildcard scope rule: should drain ALL scope waiters
+        let woken = limiter.apply_rule_update(RuleUpdate::Upsert {
+            pattern: rule("*"),
+            limit: limits(200),
+        });
+        assert_eq!(woken.len(), 3);
+    }
+}
diff --git a/util/string/src/restricted_value.rs b/util/string/src/restricted_value.rs
index 19d04e0b8a..efe4948842 100644
--- a/util/string/src/restricted_value.rs
+++ b/util/string/src/restricted_value.rs
@@ -203,6 +203,13 @@ impl<S: StringLike> std::ops::Deref for RestrictedValue<S> {
     }
 }
 
+// Needed for hashbrown's entry_ref API to lazily convert the key reference on insert.
+impl<S: Clone> From<&RestrictedValue<S>> for RestrictedValue<S> {
+    fn from(value: &RestrictedValue<S>) -> Self {
+        value.clone()
+    }
+}
+
 impl<S: OwnedStringLike> FromStr for RestrictedValue<S> {
     type Err = RestrictedValueError;
 
diff --git a/workspace-hack/Cargo.toml b/workspace-hack/Cargo.toml
index b9d312e691..f7a859c529 100644
--- a/workspace-hack/Cargo.toml
+++ b/workspace-hack/Cargo.toml
@@ -18,6 +18,7 @@ publish = false
 [dependencies]
 adaptive-timeout = { version = "0.0.1-alpha.4", features = ["schemars", "serde", "sync", "tokio"] }
 ahash = { version = "0.8", features = ["serde"] }
+arrayvec = { version = "0.7" }
 arrow = { version = "57", features = ["chrono-tz", "prettyprint"] }
 arrow-array = { version = "57", default-features = false, features = ["chrono-tz"] }
 arrow-cast = { version = "57", default-features = false, features = ["prettyprint"] }
@@ -145,6 +146,7 @@ zstd-sys = { version = "2", features = ["experimental", "std"] }
 [build-dependencies]
 adaptive-timeout = { version = "0.0.1-alpha.4", features = ["schemars", "serde", "sync", "tokio"] }
 ahash = { version = "0.8", features = ["serde"] }
+arrayvec = { version = "0.7" }
 arrow = { version = "57", features = ["chrono-tz", "prettyprint"] }
 arrow-array = { version = "57", default-features = false, features = ["chrono-tz"] }
 arrow-cast = { version = "57", default-features = false, features = ["prettyprint"] }