From 3309c28b963a39c72f334d2bd746cf75a752e632 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 18:17:39 +0000
Subject: [PATCH 01/10] Initial plan


From d90cb2a5aaf9acfbb3c6905843bccb2dc6819170 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 18:26:40 +0000
Subject: [PATCH 02/10] Implement background JWKS refresh infrastructure

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 CMakeLists.txt             |  5 +-
 src/scitokens.cpp          | 58 ++++++++++++++++++++++++
 src/scitokens.h            | 19 ++++++++
 src/scitokens_internal.cpp | 93 ++++++++++++++++++++++++++++++++++++++
 src/scitokens_internal.h   | 65 ++++++++++++++++++++++++++
 5 files changed, 239 insertions(+), 1 deletion(-)

diff --git a/CMakeLists.txt b/CMakeLists.txt
index 93973fb..ec6d2b2 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -48,7 +48,10 @@ add_library(SciTokens SHARED src/scitokens.cpp src/scitokens_internal.cpp src/sc
 target_compile_features(SciTokens PUBLIC cxx_std_11) # Use at least C++11 for building and when linking to scitokens
 target_include_directories(SciTokens PUBLIC ${JWT_CPP_INCLUDES} "${PROJECT_SOURCE_DIR}/src" PRIVATE ${CURL_INCLUDE_DIRS} ${OPENSSL_INCLUDE_DIRS} ${LIBCRYPTO_INCLUDE_DIRS} ${SQLITE_INCLUDE_DIRS}  ${UUID_INCLUDE_DIRS})
 
-target_link_libraries(SciTokens PUBLIC ${OPENSSL_LIBRARIES} ${LIBCRYPTO_LIBRARIES} ${CURL_LIBRARIES} ${SQLITE_LIBRARIES} ${UUID_LIBRARIES})
+# Find threading library
+find_package(Threads REQUIRED)
+
+target_link_libraries(SciTokens PUBLIC ${OPENSSL_LIBRARIES} ${LIBCRYPTO_LIBRARIES} ${CURL_LIBRARIES} ${SQLITE_LIBRARIES} ${UUID_LIBRARIES} Threads::Threads)
 if (UNIX)
 # pkg_check_modules fails to return an absolute path on RHEL7.  Set the
 # link directories accordingly.
diff --git a/src/scitokens.cpp b/src/scitokens.cpp
index 1d53f16..6abb264 100644
--- a/src/scitokens.cpp
+++ b/src/scitokens.cpp
@@ -49,6 +49,11 @@ int configurer::Configuration::get_monitoring_file_interval() {
     return m_monitoring_file_interval;
 }
 
+// Background refresh config
+std::atomic_bool configurer::Configuration::m_background_refresh_enabled{false};
+std::atomic_int configurer::Configuration::m_refresh_interval{60000};     // 60 seconds
+std::atomic_int configurer::Configuration::m_refresh_threshold{600000};   // 10 minutes
+
 SciTokenKey scitoken_key_create(const char *key_id, const char *alg,
                                 const char *public_contents,
                                 const char *private_contents, char **err_msg) {
@@ -1020,6 +1025,29 @@ int keycache_set_jwks(const char *issuer, const char *jwks, char **err_msg) {
     return 0;
 }
 
+int keycache_set_background_refresh(int enabled, char **err_msg) {
+    try {
+        bool enable = (enabled != 0);
+        configurer::Configuration::set_background_refresh_enabled(enable);
+        
+        if (enable) {
+            scitokens::internal::BackgroundRefreshManager::get_instance().start();
+        } else {
+            scitokens::internal::BackgroundRefreshManager::get_instance().stop();
+        }
+    } catch (std::exception &exc) {
+        if (err_msg) {
+            *err_msg = strdup(exc.what());
+        }
+        return -1;
+    }
+    return 0;
+}
+
+int keycache_stop_background_refresh(char **err_msg) {
+    return keycache_set_background_refresh(0, err_msg);
+}
+
 int config_set_int(const char *key, int value, char **err_msg) {
     return scitoken_config_set_int(key, value, err_msg);
 }
@@ -1066,6 +1094,28 @@ int scitoken_config_set_int(const char *key, int value, char **err_msg) {
         return 0;
     }
 
+    else if (_key == "keycache.refresh_interval_ms") {
+        if (value <= 0) { // zero would busy-loop the refresh thread
+            if (err_msg) {
+                *err_msg = strdup("Refresh interval must be positive.");
+            }
+            return -1;
+        }
+        configurer::Configuration::set_refresh_interval(value);
+        return 0;
+    }
+
+    else if (_key == "keycache.refresh_threshold_ms") {
+        if (value < 0) { // 0 is valid: refresh once next_update is due
+            if (err_msg) {
+                *err_msg = strdup("Refresh threshold must be non-negative.");
+            }
+            return -1;
+        }
+        configurer::Configuration::set_refresh_threshold(value);
+        return 0;
+    }
+
     else {
         if (err_msg) {
             *err_msg = strdup("Key not recognized.");
@@ -1099,6 +1149,14 @@ int scitoken_config_get_int(const char *key, char **err_msg) {
         return configurer::Configuration::get_monitoring_file_interval();
     }
 
+    else if (_key == "keycache.refresh_interval_ms") {
+        return configurer::Configuration::get_refresh_interval();
+    }
+
+    else if (_key == "keycache.refresh_threshold_ms") {
+        return configurer::Configuration::get_refresh_threshold();
+    }
+
     else {
         if (err_msg) {
             *err_msg = strdup("Key not recognized.");
diff --git a/src/scitokens.h b/src/scitokens.h
index cdf3953..a2e8256 100644
--- a/src/scitokens.h
+++ b/src/scitokens.h
@@ -290,6 +290,25 @@ int keycache_get_cached_jwks(const char *issuer, char **jwks, char **err_msg);
  */
 int keycache_set_jwks(const char *issuer, const char *jwks, char **err_msg);
 
+/**
+ * Enable or disable the background refresh thread for JWKS.
+ * - When enabled, a background thread will periodically check if any known
+ *   issuers need their JWKS refreshed based on the configured refresh interval
+ *   and threshold.
+ * - If enabled=1 and the thread is not running, it will be started.
+ * - If enabled=0 and the thread is running, it will be stopped gracefully.
+ * - Returns 0 on success, nonzero on failure.
+ */
+int keycache_set_background_refresh(int enabled, char **err_msg);
+
+/**
+ * Stop the background refresh thread if it is running.
+ * - This is a convenience function equivalent to
+ *   keycache_set_background_refresh(0, err_msg).
+ * - Returns 0 on success, nonzero on failure.
+ */
+int keycache_stop_background_refresh(char **err_msg);
+
 /**
  * APIs for managing scitokens configuration parameters.
  */
diff --git a/src/scitokens_internal.cpp b/src/scitokens_internal.cpp
index 15a74a4..e5610a8 100644
--- a/src/scitokens_internal.cpp
+++ b/src/scitokens_internal.cpp
@@ -39,6 +39,94 @@ namespace scitokens {
 
 namespace internal {
 
+// BackgroundRefreshManager implementation
+void BackgroundRefreshManager::start() {
+    if (m_running) {
+        return;  // Already running
+    }
+
+    std::call_once(m_start_once, [this]() {
+        m_shutdown = false;
+        m_running = true;
+        m_thread = std::make_unique<std::thread>(&BackgroundRefreshManager::refresh_loop, this);
+    });
+}
+
+void BackgroundRefreshManager::stop() {
+    if (!m_running) {
+        return;  // Not running
+    }
+
+    m_shutdown = true;
+    m_cv.notify_all();
+
+    if (m_thread && m_thread->joinable()) {
+        m_thread->join();
+    }
+    m_running = false;
+}
+
+void BackgroundRefreshManager::add_issuer(const std::string &issuer) {
+    std::lock_guard<std::mutex> lock(m_mutex);
+    m_issuers[issuer] = true;
+}
+
+std::vector<std::string> BackgroundRefreshManager::get_issuers() {
+    std::lock_guard<std::mutex> lock(m_mutex);
+    std::vector<std::string> result;
+    for (const auto &pair : m_issuers) {
+        result.push_back(pair.first);
+    }
+    return result;
+}
+
+void BackgroundRefreshManager::refresh_loop() {
+    while (!m_shutdown) {
+        auto interval = configurer::Configuration::get_refresh_interval();
+        auto threshold = configurer::Configuration::get_refresh_threshold();
+
+        // Wait for the interval or until shutdown
+        {
+            std::unique_lock<std::mutex> lock(m_mutex);
+            m_cv.wait_for(lock, std::chrono::milliseconds(interval),
+                          [this]() { return m_shutdown.load(); });
+        }
+
+        if (m_shutdown) {
+            break;
+        }
+
+        // Get list of issuers to check
+        auto issuers = get_issuers();
+        auto now = std::time(NULL);
+
+        for (const auto &issuer : issuers) {
+            if (m_shutdown) {
+                break;
+            }
+
+            // Check if this issuer needs refresh
+            picojson::value keys;
+            int64_t next_update;
+            if (scitokens::Validator::get_public_keys_from_db(issuer, now, keys, next_update)) {
+                // Calculate time until next_update in milliseconds
+                int64_t time_until_update = (next_update - now) * 1000;
+
+                // If next update is within threshold, try to refresh
+                if (time_until_update <= threshold) {
+                    try {
+                        // Perform refresh (this will use the refresh_jwks method)
+                        scitokens::Validator::refresh_jwks(issuer);
+                    } catch (std::exception &) {
+                        // Ignore errors in background refresh
+                        // In the future, we can track statistics here
+                    }
+                }
+            }
+        }
+    }
+}
+
 SimpleCurlGet::GetStatus SimpleCurlGet::perform_start(const std::string &url) {
     m_len = 0;
 
@@ -868,6 +956,11 @@ Validator::get_public_key_pem(const std::string &issuer, const std::string &kid,
     result->m_issuer = issuer;
     result->m_kid = kid;
 
+    // Track this issuer for background refresh if enabled
+    if (configurer::Configuration::get_background_refresh_enabled()) {
+        internal::BackgroundRefreshManager::get_instance().add_issuer(issuer);
+    }
+
     // Always call the continue because it formats the public_pem and algorithm
     return get_public_key_pem_continue(std::move(result), public_pem,
                                        algorithm);
diff --git a/src/scitokens_internal.h b/src/scitokens_internal.h
index 44bf2a7..4afe7c7 100644
--- a/src/scitokens_internal.h
+++ b/src/scitokens_internal.h
@@ -6,6 +6,8 @@
 #include <unordered_map>
 
 #include <atomic>
+#include <condition_variable>
+#include <thread>
 #include <curl/curl.h>
 #include <jwt-cpp/jwt.h>
 #include <uuid/uuid.h>
@@ -60,6 +62,22 @@ class Configuration {
         return m_monitoring_file_configured.load(std::memory_order_relaxed);
     }
 
+    // Background refresh configuration
+    static void set_background_refresh_enabled(bool enabled) {
+        m_background_refresh_enabled = enabled;
+    }
+    static bool get_background_refresh_enabled() {
+        return m_background_refresh_enabled;
+    }
+    static void set_refresh_interval(int interval_ms) {
+        m_refresh_interval = interval_ms;
+    }
+    static int get_refresh_interval() { return m_refresh_interval; }
+    static void set_refresh_threshold(int threshold_ms) {
+        m_refresh_threshold = threshold_ms;
+    }
+    static int get_refresh_threshold() { return m_refresh_threshold; }
+
   private:
     static std::atomic_int m_next_update_delta;
     static std::atomic_int m_expiry_delta;
@@ -69,6 +87,9 @@ class Configuration {
     static std::mutex m_monitoring_file_mutex;
     static std::atomic<bool> m_monitoring_file_configured; // Fast-path flag
     static std::atomic_int m_monitoring_file_interval; // In seconds, default 60
+    static std::atomic_bool m_background_refresh_enabled;
+    static std::atomic_int m_refresh_interval;    // N milliseconds
+    static std::atomic_int m_refresh_threshold;   // M milliseconds
     // static bool check_dir(const std::string dir_path);
     static std::pair<bool, std::string>
     mkdir_and_parents_if_needed(const std::string dir_path);
@@ -83,6 +104,48 @@ namespace internal {
 // Forward declaration
 class MonitoringStats;
 
+/**
+ * Manages the background thread for refreshing JWKS.
+ * This is a singleton that starts/stops a background thread which periodically
+ * checks if any known issuers need their JWKS refreshed.
+ */
+class BackgroundRefreshManager {
+  public:
+    static BackgroundRefreshManager &get_instance() {
+        static BackgroundRefreshManager instance;
+        return instance;
+    }
+
+    // Start the background refresh thread
+    void start();
+
+    // Stop the background refresh thread
+    void stop();
+
+    // Add an issuer to the list of issuers to monitor
+    void add_issuer(const std::string &issuer);
+
+    // Get all known issuers
+    std::vector<std::string> get_issuers();
+
+  private:
+    BackgroundRefreshManager() = default;
+    ~BackgroundRefreshManager() { stop(); }
+    BackgroundRefreshManager(const BackgroundRefreshManager &) = delete;
+    BackgroundRefreshManager &operator=(const BackgroundRefreshManager &) =
+        delete;
+
+    void refresh_loop();
+
+    std::mutex m_mutex;
+    std::condition_variable m_cv;
+    std::unique_ptr<std::thread> m_thread;
+    std::atomic_bool m_shutdown{false};
+    std::atomic_bool m_running{false};
+    std::once_flag m_start_once;
+    std::unordered_map<std::string, bool> m_issuers;
+};
+
 class SimpleCurlGet {
 
     int m_maxbytes{1048576};
@@ -588,6 +651,8 @@ class SciToken {
 
 class Validator {
 
+    friend class internal::BackgroundRefreshManager;
+
     typedef int (*StringValidatorFunction)(const char *value, char **err_msg);
     typedef bool (*ClaimValidatorFunction)(const jwt::claim &claim_value,
                                            void *data);

From cfc2d16d2ac54b5b532f86be8cbe44f1f038ac8f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 18:29:25 +0000
Subject: [PATCH 03/10] Add integration test for background JWKS refresh

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 test/integration_test.cpp | 153 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 153 insertions(+)

diff --git a/test/integration_test.cpp b/test/integration_test.cpp
index 15922cc..4d42a1d 100644
--- a/test/integration_test.cpp
+++ b/test/integration_test.cpp
@@ -1106,6 +1106,159 @@ TEST_F(IntegrationTest, MonitoringFileOutput) {
     std::remove(test_file.c_str());
 }
 
+// =============================================================================
+// Background JWKS Refresh Test
+// =============================================================================
+
+TEST_F(IntegrationTest, BackgroundRefreshTest) {
+    char *err_msg = nullptr;
+
+    // Set smaller intervals for testing (1 second refresh interval, 2 seconds threshold)
+    int rv = scitoken_config_set_int("keycache.refresh_interval_ms", 1000, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to set refresh interval: "
+                     << (err_msg ? err_msg : "unknown error");
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    rv = scitoken_config_set_int("keycache.refresh_threshold_ms", 2000, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to set refresh threshold: "
+                     << (err_msg ? err_msg : "unknown error");
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    // Create a key and token
+    std::unique_ptr<void, decltype(&scitoken_key_destroy)> key(
+        scitoken_key_create("test-key-1", "ES256", public_key_.c_str(),
+                            private_key_.c_str(), &err_msg),
+        scitoken_key_destroy);
+    ASSERT_TRUE(key.get() != nullptr);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    std::unique_ptr<void, decltype(&scitoken_destroy)> token(
+        scitoken_create(key.get()), scitoken_destroy);
+    ASSERT_TRUE(token.get() != nullptr);
+
+    rv = scitoken_set_claim_string(token.get(), "iss", issuer_url_.c_str(),
+                                    &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    rv = scitoken_set_claim_string(token.get(), "sub", "test-subject", &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    rv = scitoken_set_claim_string(token.get(), "scope", "read:/test", &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    scitoken_set_lifetime(token.get(), 3600);
+
+    char *token_value = nullptr;
+    rv = scitoken_serialize(token.get(), &token_value, &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+    std::unique_ptr<char, decltype(&free)> token_value_ptr(token_value, free);
+
+    // First verification - this will fetch JWKS and track the issuer
+    std::unique_ptr<void, decltype(&scitoken_destroy)> verify_token(
+        scitoken_create(nullptr), scitoken_destroy);
+    ASSERT_TRUE(verify_token.get() != nullptr);
+
+    rv = scitoken_deserialize_v2(token_value, verify_token.get(), nullptr, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to verify token: "
+                     << (err_msg ? err_msg : "unknown error");
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    // Get the current JWKS to verify it exists
+    char *jwks_before = nullptr;
+    rv = keycache_get_cached_jwks(issuer_url_.c_str(), &jwks_before, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to get cached JWKS: "
+                     << (err_msg ? err_msg : "unknown error");
+    ASSERT_TRUE(jwks_before != nullptr);
+    std::unique_ptr<char, decltype(&free)> jwks_before_ptr(jwks_before, free);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    std::cout << "Initial JWKS fetched successfully" << std::endl;
+
+    // Set update interval to 1 second so keys will need refresh soon
+    rv = scitoken_config_set_int("keycache.update_interval_s", 1, &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    // Enable background refresh
+    rv = keycache_set_background_refresh(1, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to enable background refresh: "
+                     << (err_msg ? err_msg : "unknown error");
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    std::cout << "Background refresh enabled" << std::endl;
+
+    // Wait for background refresh to trigger (threshold is 2 seconds, interval is 1 second)
+    // We need to wait at least 3 seconds: 1s for next_update to be within threshold + 2s for detection
+    std::cout << "Waiting 4 seconds for background refresh..." << std::endl;
+    sleep(4);
+
+    // The background refresh should have occurred
+    // We can't easily verify it refreshed without instrumenting the code more,
+    // but we can verify the thread is running and didn't crash
+    
+    // Stop background refresh
+    rv = keycache_stop_background_refresh(&err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to stop background refresh: "
+                     << (err_msg ? err_msg : "unknown error");
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    std::cout << "Background refresh stopped successfully" << std::endl;
+
+    // Verify we can still access the JWKS
+    char *jwks_after = nullptr;
+    rv = keycache_get_cached_jwks(issuer_url_.c_str(), &jwks_after, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to get cached JWKS after background refresh: "
+                     << (err_msg ? err_msg : "unknown error");
+    ASSERT_TRUE(jwks_after != nullptr);
+    std::unique_ptr<char, decltype(&free)> jwks_after_ptr(jwks_after, free);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
+    std::cout << "Test completed successfully" << std::endl;
+}
+
 } // namespace
 
 int main(int argc, char **argv) {

From d7961314050483388b78de0aa4dbaa0c4bb9b478 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 18:35:31 +0000
Subject: [PATCH 04/10] Address code review feedback - improve thread safety
 and documentation

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 src/scitokens_internal.cpp | 14 ++++++++------
 src/scitokens_internal.h   |  5 +++++
 test/integration_test.cpp  |  2 ++
 3 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/src/scitokens_internal.cpp b/src/scitokens_internal.cpp
index e5610a8..64c5d78 100644
--- a/src/scitokens_internal.cpp
+++ b/src/scitokens_internal.cpp
@@ -1,4 +1,5 @@
 
+#include <chrono>
 #include <functional>
 #include <memory>
 #include <sstream>
@@ -41,10 +42,7 @@ namespace internal {
 
 // BackgroundRefreshManager implementation
 void BackgroundRefreshManager::start() {
-    if (m_running) {
-        return;  // Already running
-    }
-
+    // call_once ensures this block runs exactly once, even if called from multiple threads
     std::call_once(m_start_once, [this]() {
         m_shutdown = false;
         m_running = true;
@@ -118,8 +116,12 @@ void BackgroundRefreshManager::refresh_loop() {
                         // Perform refresh (this will use the refresh_jwks method)
                         scitokens::Validator::refresh_jwks(issuer);
                     } catch (std::exception &) {
-                        // Ignore errors in background refresh
-                        // In the future, we can track statistics here
+                        // Silently ignore errors in background refresh to avoid
+                        // disrupting the application. Background refresh is a best-effort
+                        // optimization. If it fails, the next token verification will
+                        // trigger a foreground refresh as usual.
+                        // TODO: In future work, track statistics (success/failure counts)
+                        // to monitor refresh health.
                     }
                 }
             }
diff --git a/src/scitokens_internal.h b/src/scitokens_internal.h
index 4afe7c7..77cc233 100644
--- a/src/scitokens_internal.h
+++ b/src/scitokens_internal.h
@@ -836,6 +836,11 @@ class Validator {
 
     std::unique_ptr<AsyncStatus>
     verify_async(const jwt::decoded_jwt<jwt::traits::kazuho_picojson> &jwt) {
+        // Start background refresh thread if configured (using once_flag to ensure it only happens once)
+        if (configurer::Configuration::get_background_refresh_enabled()) {
+            internal::BackgroundRefreshManager::get_instance().start();
+        }
+
         // If token has a typ header claim (RFC8725 Section 3.11), trust that in
         // COMPAT mode.
         if (jwt.has_type()) {
diff --git a/test/integration_test.cpp b/test/integration_test.cpp
index 4d42a1d..75a298f 100644
--- a/test/integration_test.cpp
+++ b/test/integration_test.cpp
@@ -1226,6 +1226,8 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
 
     // Wait for background refresh to trigger (threshold is 2 seconds, interval is 1 second)
     // We need to wait at least 3 seconds: 1s for next_update to be within threshold + 2s for detection
+    // Note: Using sleep() is acceptable for integration tests as we're verifying real-time behavior
+    // of the background thread against an actual HTTPS server
     std::cout << "Waiting 4 seconds for background refresh..." << std::endl;
     sleep(4);
 

From e9448864cd7bd4573660336c82a2bb236c7819d2 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 19:13:46 +0000
Subject: [PATCH 05/10] Address code review feedback: allow multiple start/stop
 cycles, use database to get issuers

- Remove once_flag from BackgroundRefreshManager, allowing multiple start/stop cycles
- Move once_flag to Validator class for first-time initialization on verification
- Remove issuer tracking (add_issuer, get_issuers, m_issuers map)
- Add get_all_issuers_from_db() method to retrieve issuers from SQLite cache
- Update refresh_loop to query database instead of tracking issuers
- Improve thread safety in start/stop methods with proper mutex handling
- Format code with clang-format

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 src/scitokens.cpp          | 14 ++++--
 src/scitokens_cache.cpp    | 74 +++++++++++++++++++++++++++++
 src/scitokens_internal.cpp | 97 +++++++++++++++++---------------------
 src/scitokens_internal.h   | 43 +++++++++--------
 4 files changed, 151 insertions(+), 77 deletions(-)

diff --git a/src/scitokens.cpp b/src/scitokens.cpp
index 6abb264..f7051a4 100644
--- a/src/scitokens.cpp
+++ b/src/scitokens.cpp
@@ -51,8 +51,10 @@ int configurer::Configuration::get_monitoring_file_interval() {
 
 // Background refresh config
 std::atomic_bool configurer::Configuration::m_background_refresh_enabled{false};
-std::atomic_int configurer::Configuration::m_refresh_interval{60000};     // 60 seconds
-std::atomic_int configurer::Configuration::m_refresh_threshold{600000};   // 10 minutes
+std::atomic_int configurer::Configuration::m_refresh_interval{
+    60000}; // 60 seconds
+std::atomic_int configurer::Configuration::m_refresh_threshold{
+    600000}; // 10 minutes
 
 SciTokenKey scitoken_key_create(const char *key_id, const char *alg,
                                 const char *public_contents,
@@ -1029,11 +1031,13 @@ int keycache_set_background_refresh(int enabled, char **err_msg) {
     try {
         bool enable = (enabled != 0);
         configurer::Configuration::set_background_refresh_enabled(enable);
-        
+
         if (enable) {
-            scitokens::internal::BackgroundRefreshManager::get_instance().start();
+            scitokens::internal::BackgroundRefreshManager::get_instance()
+                .start();
         } else {
-            scitokens::internal::BackgroundRefreshManager::get_instance().stop();
+            scitokens::internal::BackgroundRefreshManager::get_instance()
+                .stop();
         }
     } catch (std::exception &exc) {
         if (err_msg) {
diff --git a/src/scitokens_cache.cpp b/src/scitokens_cache.cpp
index 12536c1..e293e64 100644
--- a/src/scitokens_cache.cpp
+++ b/src/scitokens_cache.cpp
@@ -308,3 +308,77 @@ bool scitokens::Validator::store_public_keys(const std::string &issuer,
     sqlite3_close(db);
     return true;
 }
+
+/**
+ * Return (issuer, next_update) for every non-expired row of `keycache`.
+ * Rows with a NULL column, unparsable JSON, or no integer `expires` are
+ * skipped; failure to open or query the cache yields an empty vector.
+ */
+std::vector<std::pair<std::string, int64_t>>
+scitokens::Validator::get_all_issuers_from_db(int64_t now) {
+    std::vector<std::pair<std::string, int64_t>> result;
+    auto cache_fname = get_cache_file();
+    if (cache_fname.size() == 0) {
+        return result;
+    }
+
+    sqlite3 *db;
+    int rc = sqlite3_open(cache_fname.c_str(), &db);
+    if (rc) {
+        sqlite3_close(db);
+        return result;
+    }
+
+    sqlite3_stmt *stmt;
+    rc = sqlite3_prepare_v2(db, "SELECT issuer, keys FROM keycache", -1, &stmt,
+                            NULL);
+    if (rc != SQLITE_OK) {
+        sqlite3_close(db);
+        return result;
+    }
+
+    while ((rc = sqlite3_step(stmt)) == SQLITE_ROW) {
+        const unsigned char *issuer_data = sqlite3_column_text(stmt, 0);
+        const unsigned char *keys_data = sqlite3_column_text(stmt, 1);
+        if (!issuer_data || !keys_data) {
+            continue;
+        }
+        std::string issuer(reinterpret_cast<const char *>(issuer_data));
+        std::string metadata(reinterpret_cast<const char *>(keys_data));
+
+        // Parse the metadata to get next_update and check expiry
+        picojson::value json_obj;
+        auto err = picojson::parse(json_obj, metadata);
+        if (!err.empty() || !json_obj.is<picojson::object>()) {
+            continue;
+        }
+        // Bind by reference; a copy would duplicate the whole parsed entry.
+        const auto &top_obj = json_obj.get<picojson::object>();
+
+        // Check if expired
+        auto expires_iter = top_obj.find("expires");
+        if (expires_iter == top_obj.end() ||
+            !expires_iter->second.is<int64_t>()) {
+            continue;
+        }
+        auto expiry = expires_iter->second.get<int64_t>();
+        if (now > expiry) {
+            continue; // Skip expired entries
+        }
+
+        // Get next_update time
+        auto next_update_iter = top_obj.find("next_update");
+        int64_t next_update;
+        if (next_update_iter == top_obj.end() ||
+            !next_update_iter->second.is<int64_t>()) {
+            // If next_update is not set, default to 4 hours before expiry
+            next_update = expiry - 4 * 3600;
+        } else {
+            next_update = next_update_iter->second.get<int64_t>();
+        }
+        result.push_back({issuer, next_update});
+    }
+    sqlite3_finalize(stmt);
+    sqlite3_close(db);
+    return result;
+}
diff --git a/src/scitokens_internal.cpp b/src/scitokens_internal.cpp
index 64c5d78..d294de2 100644
--- a/src/scitokens_internal.cpp
+++ b/src/scitokens_internal.cpp
@@ -38,44 +38,42 @@ std::mutex key_refresh_mutex;
 
 namespace scitokens {
 
+// Define the static once_flag for Validator
+std::once_flag Validator::m_background_refresh_once;
+
 namespace internal {
 
 // BackgroundRefreshManager implementation
 void BackgroundRefreshManager::start() {
-    // call_once ensures this block runs exactly once, even if called from multiple threads
-    std::call_once(m_start_once, [this]() {
-        m_shutdown = false;
-        m_running = true;
-        m_thread = std::make_unique<std::thread>(&BackgroundRefreshManager::refresh_loop, this);
-    });
+    std::lock_guard<std::mutex> lock(m_mutex);
+    if (m_running) {
+        return; // Already running
+    }
+    m_shutdown = false;
+    m_running = true;
+    m_thread = std::make_unique<std::thread>(
+        &BackgroundRefreshManager::refresh_loop, this);
 }
 
 void BackgroundRefreshManager::stop() {
-    if (!m_running) {
-        return;  // Not running
-    }
+    std::unique_ptr<std::thread> thread_to_join;
 
-    m_shutdown = true;
-    m_cv.notify_all();
+    {
+        std::lock_guard<std::mutex> lock(m_mutex);
+        if (!m_running) {
+            return; // Not running
+        }
 
-    if (m_thread && m_thread->joinable()) {
-        m_thread->join();
+        m_shutdown = true;
+        m_running = false;
+        thread_to_join = std::move(m_thread);
     }
-    m_running = false;
-}
 
-void BackgroundRefreshManager::add_issuer(const std::string &issuer) {
-    std::lock_guard<std::mutex> lock(m_mutex);
-    m_issuers[issuer] = true;
-}
+    m_cv.notify_all();
 
-std::vector<std::string> BackgroundRefreshManager::get_issuers() {
-    std::lock_guard<std::mutex> lock(m_mutex);
-    std::vector<std::string> result;
-    for (const auto &pair : m_issuers) {
-        result.push_back(pair.first);
+    if (thread_to_join && thread_to_join->joinable()) {
+        thread_to_join->join();
     }
-    return result;
 }
 
 void BackgroundRefreshManager::refresh_loop() {
@@ -94,35 +92,33 @@ void BackgroundRefreshManager::refresh_loop() {
             break;
         }
 
-        // Get list of issuers to check
-        auto issuers = get_issuers();
+        // Get list of issuers from the database
         auto now = std::time(NULL);
+        auto issuers = scitokens::Validator::get_all_issuers_from_db(now);
 
-        for (const auto &issuer : issuers) {
+        for (const auto &issuer_pair : issuers) {
             if (m_shutdown) {
                 break;
             }
 
-            // Check if this issuer needs refresh
-            picojson::value keys;
-            int64_t next_update;
-            if (scitokens::Validator::get_public_keys_from_db(issuer, now, keys, next_update)) {
-                // Calculate time until next_update in milliseconds
-                int64_t time_until_update = (next_update - now) * 1000;
-
-                // If next update is within threshold, try to refresh
-                if (time_until_update <= threshold) {
-                    try {
-                        // Perform refresh (this will use the refresh_jwks method)
-                        scitokens::Validator::refresh_jwks(issuer);
-                    } catch (std::exception &) {
-                        // Silently ignore errors in background refresh to avoid
-                        // disrupting the application. Background refresh is a best-effort
-                        // optimization. If it fails, the next token verification will
-                        // trigger a foreground refresh as usual.
-                        // TODO: In future work, track statistics (success/failure counts)
-                        // to monitor refresh health.
-                    }
+            const auto &issuer = issuer_pair.first;
+            const auto &next_update = issuer_pair.second;
+
+            // Calculate time until next_update in milliseconds
+            int64_t time_until_update = (next_update - now) * 1000;
+
+            // If next update is within threshold, try to refresh
+            if (time_until_update <= threshold) {
+                try {
+                    // Perform refresh (this will use the refresh_jwks method)
+                    scitokens::Validator::refresh_jwks(issuer);
+                } catch (std::exception &) {
+                    // Silently ignore errors in background refresh to avoid
+                    // disrupting the application. Background refresh is a
+                    // best-effort optimization. If it fails, the next token
+                    // verification will trigger a foreground refresh as usual.
+                    // TODO: In future work, track statistics (success/failure
+                    // counts) to monitor refresh health.
                 }
             }
         }
@@ -958,11 +954,6 @@ Validator::get_public_key_pem(const std::string &issuer, const std::string &kid,
     result->m_issuer = issuer;
     result->m_kid = kid;
 
-    // Track this issuer for background refresh if enabled
-    if (configurer::Configuration::get_background_refresh_enabled()) {
-        internal::BackgroundRefreshManager::get_instance().add_issuer(issuer);
-    }
-
     // Always call the continue because it formats the public_pem and algorithm
     return get_public_key_pem_continue(std::move(result), public_pem,
                                        algorithm);
diff --git a/src/scitokens_internal.h b/src/scitokens_internal.h
index 77cc233..9f21350 100644
--- a/src/scitokens_internal.h
+++ b/src/scitokens_internal.h
@@ -7,9 +7,9 @@
 
 #include <atomic>
 #include <condition_variable>
-#include <thread>
 #include <curl/curl.h>
 #include <jwt-cpp/jwt.h>
+#include <thread>
 #include <uuid/uuid.h>
 
 #if defined(__GNUC__)
@@ -88,8 +88,8 @@ class Configuration {
     static std::atomic<bool> m_monitoring_file_configured; // Fast-path flag
     static std::atomic_int m_monitoring_file_interval; // In seconds, default 60
     static std::atomic_bool m_background_refresh_enabled;
-    static std::atomic_int m_refresh_interval;    // N milliseconds
-    static std::atomic_int m_refresh_threshold;   // M milliseconds
+    static std::atomic_int m_refresh_interval;  // N milliseconds
+    static std::atomic_int m_refresh_threshold; // M milliseconds
     // static bool check_dir(const std::string dir_path);
     static std::pair<bool, std::string>
     mkdir_and_parents_if_needed(const std::string dir_path);
@@ -116,24 +116,18 @@ class BackgroundRefreshManager {
         return instance;
     }
 
-    // Start the background refresh thread
+    // Start the background refresh thread (can be called multiple times)
     void start();
 
-    // Stop the background refresh thread
+    // Stop the background refresh thread (can be called multiple times)
     void stop();
 
-    // Add an issuer to the list of issuers to monitor
-    void add_issuer(const std::string &issuer);
-
-    // Get all known issuers
-    std::vector<std::string> get_issuers();
-
   private:
     BackgroundRefreshManager() = default;
     ~BackgroundRefreshManager() { stop(); }
     BackgroundRefreshManager(const BackgroundRefreshManager &) = delete;
-    BackgroundRefreshManager &operator=(const BackgroundRefreshManager &) =
-        delete;
+    BackgroundRefreshManager &
+    operator=(const BackgroundRefreshManager &) = delete;
 
     void refresh_loop();
 
@@ -142,8 +136,6 @@ class BackgroundRefreshManager {
     std::unique_ptr<std::thread> m_thread;
     std::atomic_bool m_shutdown{false};
     std::atomic_bool m_running{false};
-    std::once_flag m_start_once;
-    std::unordered_map<std::string, bool> m_issuers;
 };
 
 class SimpleCurlGet {
@@ -836,10 +828,12 @@ class Validator {
 
     std::unique_ptr<AsyncStatus>
     verify_async(const jwt::decoded_jwt<jwt::traits::kazuho_picojson> &jwt) {
-        // Start background refresh thread if configured (using once_flag to ensure it only happens once)
-        if (configurer::Configuration::get_background_refresh_enabled()) {
-            internal::BackgroundRefreshManager::get_instance().start();
-        }
+        // Start background refresh thread if configured on first verification
+        std::call_once(m_background_refresh_once, []() {
+            if (configurer::Configuration::get_background_refresh_enabled()) {
+                internal::BackgroundRefreshManager::get_instance().start();
+            }
+        });
 
         // If token has a typ header claim (RFC8725 Section 3.11), trust that in
         // COMPAT mode.
@@ -1187,6 +1181,14 @@ class Validator {
      */
     static std::string get_jwks(const std::string &issuer);
 
+    /**
+     * Get all issuers from the database along with their next_update times.
+     * Returns a vector of pairs (issuer, next_update).
+     * Only returns non-expired entries.
+     */
+    static std::vector<std::pair<std::string, int64_t>>
+    get_all_issuers_from_db(int64_t now);
+
   private:
     static std::unique_ptr<AsyncStatus>
     get_public_key_pem(const std::string &issuer, const std::string &kid,
@@ -1257,6 +1259,9 @@ class Validator {
 
     std::vector<std::string> m_critical_claims;
     std::vector<std::string> m_allowed_issuers;
+
+    // Once flag for starting background refresh on first verification
+    static std::once_flag m_background_refresh_once;
 };
 
 class Enforcer {

From d664bee8506a4ca160a1ccb0a0a887fb545be7a7 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 20:22:22 +0000
Subject: [PATCH 06/10] Address code review: include expired entries, use
 acquire/release semantics

- Include expired entries in get_all_issuers_from_db() for refresh after long downtime
- Set next_update to now for expired entries so they get refreshed immediately
- Use std::memory_order_acquire/release for all atomic operations instead of sequential consistency
- Improves performance while maintaining proper synchronization guarantees

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 src/scitokens_cache.cpp    | 12 ++++++++----
 src/scitokens_internal.cpp | 23 ++++++++++++-----------
 2 files changed, 20 insertions(+), 15 deletions(-)

diff --git a/src/scitokens_cache.cpp b/src/scitokens_cache.cpp
index e293e64..36173e2 100644
--- a/src/scitokens_cache.cpp
+++ b/src/scitokens_cache.cpp
@@ -353,16 +353,13 @@ scitokens::Validator::get_all_issuers_from_db(int64_t now) {
 
         auto top_obj = json_obj.get<picojson::object>();
 
-        // Check if expired
+        // Get expiry time
         auto expires_iter = top_obj.find("expires");
         if (expires_iter == top_obj.end() ||
             !expires_iter->second.is<int64_t>()) {
             continue;
         }
         auto expiry = expires_iter->second.get<int64_t>();
-        if (now > expiry) {
-            continue; // Skip expired entries
-        }
 
         // Get next_update time
         auto next_update_iter = top_obj.find("next_update");
@@ -375,6 +372,13 @@ scitokens::Validator::get_all_issuers_from_db(int64_t now) {
             next_update = next_update_iter->second.get<int64_t>();
         }
 
+        // Include expired entries - they should be refreshed after a long
+        // downtime. If expired, set next_update to now so they get refreshed
+        // immediately.
+        if (now > expiry) {
+            next_update = now;
+        }
+
         result.push_back({issuer, next_update});
     }
 
diff --git a/src/scitokens_internal.cpp b/src/scitokens_internal.cpp
index d294de2..5b1acde 100644
--- a/src/scitokens_internal.cpp
+++ b/src/scitokens_internal.cpp
@@ -46,11 +46,11 @@ namespace internal {
 // BackgroundRefreshManager implementation
 void BackgroundRefreshManager::start() {
     std::lock_guard<std::mutex> lock(m_mutex);
-    if (m_running) {
+    if (m_running.load(std::memory_order_acquire)) {
         return; // Already running
     }
-    m_shutdown = false;
-    m_running = true;
+    m_shutdown.store(false, std::memory_order_release);
+    m_running.store(true, std::memory_order_release);
     m_thread = std::make_unique<std::thread>(
         &BackgroundRefreshManager::refresh_loop, this);
 }
@@ -60,12 +60,12 @@ void BackgroundRefreshManager::stop() {
 
     {
         std::lock_guard<std::mutex> lock(m_mutex);
-        if (!m_running) {
+        if (!m_running.load(std::memory_order_acquire)) {
             return; // Not running
         }
 
-        m_shutdown = true;
-        m_running = false;
+        m_shutdown.store(true, std::memory_order_release);
+        m_running.store(false, std::memory_order_release);
         thread_to_join = std::move(m_thread);
     }
 
@@ -77,18 +77,19 @@ void BackgroundRefreshManager::stop() {
 }
 
 void BackgroundRefreshManager::refresh_loop() {
-    while (!m_shutdown) {
+    while (!m_shutdown.load(std::memory_order_acquire)) {
         auto interval = configurer::Configuration::get_refresh_interval();
         auto threshold = configurer::Configuration::get_refresh_threshold();
 
         // Wait for the interval or until shutdown
         {
             std::unique_lock<std::mutex> lock(m_mutex);
-            m_cv.wait_for(lock, std::chrono::milliseconds(interval),
-                          [this]() { return m_shutdown.load(); });
+            m_cv.wait_for(lock, std::chrono::milliseconds(interval), [this]() {
+                return m_shutdown.load(std::memory_order_acquire);
+            });
         }
 
-        if (m_shutdown) {
+        if (m_shutdown.load(std::memory_order_acquire)) {
             break;
         }
 
@@ -97,7 +98,7 @@ void BackgroundRefreshManager::refresh_loop() {
         auto issuers = scitokens::Validator::get_all_issuers_from_db(now);
 
         for (const auto &issuer_pair : issuers) {
-            if (m_shutdown) {
+            if (m_shutdown.load(std::memory_order_acquire)) {
                 break;
             }
 

From 5b0b8626276330f23f4a432dc205ac67c94c510f Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 9 Dec 2025 20:45:02 +0000
Subject: [PATCH 07/10] Fix clang-format linter issues in integration test

- Apply clang-format to test/integration_test.cpp
- Fix line wrapping and indentation to comply with LLVM style
- No functional changes, only formatting adjustments

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 test/integration_test.cpp | 31 +++++++++++++++++++------------
 1 file changed, 19 insertions(+), 12 deletions(-)

diff --git a/test/integration_test.cpp b/test/integration_test.cpp
index 75a298f..9c7e78f 100644
--- a/test/integration_test.cpp
+++ b/test/integration_test.cpp
@@ -1113,8 +1113,10 @@ TEST_F(IntegrationTest, MonitoringFileOutput) {
 TEST_F(IntegrationTest, BackgroundRefreshTest) {
     char *err_msg = nullptr;
 
-    // Set smaller intervals for testing (1 second refresh interval, 2 seconds threshold)
-    int rv = scitoken_config_set_int("keycache.refresh_interval_ms", 1000, &err_msg);
+    // Set smaller intervals for testing (1 second refresh interval, 2 seconds
+    // threshold)
+    int rv =
+        scitoken_config_set_int("keycache.refresh_interval_ms", 1000, &err_msg);
     ASSERT_EQ(rv, 0) << "Failed to set refresh interval: "
                      << (err_msg ? err_msg : "unknown error");
     if (err_msg) {
@@ -1122,7 +1124,8 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
         err_msg = nullptr;
     }
 
-    rv = scitoken_config_set_int("keycache.refresh_threshold_ms", 2000, &err_msg);
+    rv = scitoken_config_set_int("keycache.refresh_threshold_ms", 2000,
+                                 &err_msg);
     ASSERT_EQ(rv, 0) << "Failed to set refresh threshold: "
                      << (err_msg ? err_msg : "unknown error");
     if (err_msg) {
@@ -1146,21 +1149,23 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
     ASSERT_TRUE(token.get() != nullptr);
 
     rv = scitoken_set_claim_string(token.get(), "iss", issuer_url_.c_str(),
-                                    &err_msg);
+                                   &err_msg);
     ASSERT_EQ(rv, 0);
     if (err_msg) {
         free(err_msg);
         err_msg = nullptr;
     }
 
-    rv = scitoken_set_claim_string(token.get(), "sub", "test-subject", &err_msg);
+    rv =
+        scitoken_set_claim_string(token.get(), "sub", "test-subject", &err_msg);
     ASSERT_EQ(rv, 0);
     if (err_msg) {
         free(err_msg);
         err_msg = nullptr;
     }
 
-    rv = scitoken_set_claim_string(token.get(), "scope", "read:/test", &err_msg);
+    rv =
+        scitoken_set_claim_string(token.get(), "scope", "read:/test", &err_msg);
     ASSERT_EQ(rv, 0);
     if (err_msg) {
         free(err_msg);
@@ -1183,7 +1188,8 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
         scitoken_create(nullptr), scitoken_destroy);
     ASSERT_TRUE(verify_token.get() != nullptr);
 
-    rv = scitoken_deserialize_v2(token_value, verify_token.get(), nullptr, &err_msg);
+    rv = scitoken_deserialize_v2(token_value, verify_token.get(), nullptr,
+                                 &err_msg);
     ASSERT_EQ(rv, 0) << "Failed to verify token: "
                      << (err_msg ? err_msg : "unknown error");
     if (err_msg) {
@@ -1224,17 +1230,18 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
 
     std::cout << "Background refresh enabled" << std::endl;
 
-    // Wait for background refresh to trigger (threshold is 2 seconds, interval is 1 second)
-    // We need to wait at least 3 seconds: 1s for next_update to be within threshold + 2s for detection
-    // Note: Using sleep() is acceptable for integration tests as we're verifying real-time behavior
-    // of the background thread against an actual HTTPS server
+    // Wait for background refresh to trigger (threshold is 2 seconds, interval
+    // is 1 second). We need to wait at least 3 seconds: 1s for next_update to
+    // be within threshold + 2s for detection. Note: Using sleep() is
+    // acceptable for integration tests as we're verifying real-time behavior
+    // of the background thread against an actual HTTPS server.
     std::cout << "Waiting 4 seconds for background refresh..." << std::endl;
     sleep(4);
 
     // The background refresh should have occurred
     // We can't easily verify it refreshed without instrumenting the code more,
     // but we can verify the thread is running and didn't crash
-    
+
     // Stop background refresh
     rv = keycache_stop_background_refresh(&err_msg);
     ASSERT_EQ(rv, 0) << "Failed to stop background refresh: "

From 0c973ffbc34651ab9dfd73fdab4cf2405e945ad6 Mon Sep 17 00:00:00 2001
From: Brian P Bockelman <bockelman@gmail.com>
Date: Wed, 10 Dec 2025 18:44:48 +0000
Subject: [PATCH 08/10] Add background refresh statistics and monitoring
 coordination

- Add background_successful_refreshes and background_failed_refreshes
  counters to IssuerStats for tracking per-issuer background refresh results
- Add is_running() method to BackgroundRefreshManager to check thread state
- Track statistics in refresh_loop() when JWKS refresh succeeds or fails
- Add maybe_write_monitoring_file_from_verify() that skips file writes when
  background refresh thread is running (to avoid redundant writes)
- Write monitoring file from background thread at end of each refresh cycle
- Update get_json() to include new background refresh statistics
- Update integration test to verify background refresh via monitoring API
  using keycache_set_jwks() to force cache entry with short update interval
---
 src/scitokens_internal.cpp   | 11 ++++-
 src/scitokens_internal.h     | 30 +++++++++++--
 src/scitokens_monitoring.cpp | 15 +++++++
 test/integration_test.cpp    | 84 ++++++++++++++++++++++++++++++++----
 4 files changed, 126 insertions(+), 14 deletions(-)

diff --git a/src/scitokens_internal.cpp b/src/scitokens_internal.cpp
index 5b1acde..82e8c2e 100644
--- a/src/scitokens_internal.cpp
+++ b/src/scitokens_internal.cpp
@@ -110,19 +110,26 @@ void BackgroundRefreshManager::refresh_loop() {
 
             // If next update is within threshold, try to refresh
             if (time_until_update <= threshold) {
+                auto &stats =
+                    MonitoringStats::instance().get_issuer_stats(issuer);
                 try {
                     // Perform refresh (this will use the refresh_jwks method)
                     scitokens::Validator::refresh_jwks(issuer);
+                    stats.inc_background_successful_refresh();
                 } catch (std::exception &) {
+                    // Track failed refresh attempts
+                    stats.inc_background_failed_refresh();
                     // Silently ignore errors in background refresh to avoid
                     // disrupting the application. Background refresh is a
                     // best-effort optimization. If it fails, the next token
                     // verification will trigger a foreground refresh as usual.
-                    // TODO: In future work, track statistics (success/failure
-                    // counts) to monitor refresh health.
                 }
             }
         }
+
+        // Write monitoring file from background thread if configured
+        // This avoids writing from verify() when background thread is running
+        MonitoringStats::instance().maybe_write_monitoring_file();
     }
 }
 
diff --git a/src/scitokens_internal.h b/src/scitokens_internal.h
index 9f21350..7520c1d 100644
--- a/src/scitokens_internal.h
+++ b/src/scitokens_internal.h
@@ -122,6 +122,11 @@ class BackgroundRefreshManager {
     // Stop the background refresh thread (can be called multiple times)
     void stop();
 
+    // Check if the background refresh thread is running
+    bool is_running() const {
+        return m_running.load(std::memory_order_acquire);
+    }
+
   private:
     BackgroundRefreshManager() = default;
     ~BackgroundRefreshManager() { stop(); }
@@ -216,6 +221,10 @@ struct IssuerStats {
     std::atomic<uint64_t> failed_refreshes{0};
     std::atomic<uint64_t> stale_key_uses{0};
 
+    // Background refresh statistics (tracked by background thread)
+    std::atomic<uint64_t> background_successful_refreshes{0};
+    std::atomic<uint64_t> background_failed_refreshes{0};
+
     // Increment methods for atomic counters
     void inc_successful_validation() { successful_validations++; }
     void inc_unsuccessful_validation() { unsuccessful_validations++; }
@@ -227,6 +236,10 @@ struct IssuerStats {
     void inc_expired_key() { expired_keys++; }
     void inc_successful_key_lookup() { successful_key_lookups++; }
     void inc_failed_key_lookup() { failed_key_lookups++; }
+    void inc_background_successful_refresh() {
+        background_successful_refreshes++;
+    }
+    void inc_background_failed_refresh() { background_failed_refreshes++; }
 
     // Time setters that accept std::chrono::duration
     template <typename Rep, typename Period>
@@ -321,6 +334,13 @@ class MonitoringStats {
      */
     void maybe_write_monitoring_file() noexcept;
 
+    /**
+     * Same as maybe_write_monitoring_file(), but skips if background refresh
+     * thread is running. This should be called from verify() routines to
+     * avoid redundant writes when the background thread is handling them.
+     */
+    void maybe_write_monitoring_file_from_verify() noexcept;
+
   private:
     MonitoringStats() = default;
     ~MonitoringStats() = default;
@@ -674,8 +694,9 @@ class Validator {
 
     void verify(const SciToken &scitoken, time_t expiry_time) {
         // Check if monitoring file should be written (fast-path, relaxed
-        // atomic)
-        internal::MonitoringStats::instance().maybe_write_monitoring_file();
+        // atomic). Skip if background thread is running.
+        internal::MonitoringStats::instance()
+            .maybe_write_monitoring_file_from_verify();
 
         std::string issuer = "";
         auto start_time = std::chrono::steady_clock::now();
@@ -770,8 +791,9 @@ class Validator {
 
     void verify(const jwt::decoded_jwt<jwt::traits::kazuho_picojson> &jwt) {
         // Check if monitoring file should be written (fast-path, relaxed
-        // atomic)
-        internal::MonitoringStats::instance().maybe_write_monitoring_file();
+        // atomic). Skip if background thread is running.
+        internal::MonitoringStats::instance()
+            .maybe_write_monitoring_file_from_verify();
 
         std::string issuer = "";
         auto start_time = std::chrono::steady_clock::now();
diff --git a/src/scitokens_monitoring.cpp b/src/scitokens_monitoring.cpp
index b264287..0a019c3 100644
--- a/src/scitokens_monitoring.cpp
+++ b/src/scitokens_monitoring.cpp
@@ -121,6 +121,12 @@ std::string MonitoringStats::get_json() const {
         issuer_obj["stale_key_uses"] =
             picojson::value(static_cast<double>(stats.stale_key_uses.load()));
 
+        // Background refresh statistics
+        issuer_obj["background_successful_refreshes"] = picojson::value(
+            static_cast<double>(stats.background_successful_refreshes.load()));
+        issuer_obj["background_failed_refreshes"] = picojson::value(
+            static_cast<double>(stats.background_failed_refreshes.load()));
+
         std::string sanitized_issuer = sanitize_issuer_for_json(issuer);
         issuers_obj[sanitized_issuer] = picojson::value(issuer_obj);
     }
@@ -190,6 +196,15 @@ void MonitoringStats::maybe_write_monitoring_file() noexcept {
     }
 }
 
+void MonitoringStats::maybe_write_monitoring_file_from_verify() noexcept {
+    // If background refresh thread is running, it will handle the writes
+    // This avoids redundant writes and potential contention
+    if (BackgroundRefreshManager::get_instance().is_running()) {
+        return;
+    }
+    maybe_write_monitoring_file();
+}
+
 void MonitoringStats::write_monitoring_file_impl() noexcept {
     try {
         std::string monitoring_file =
diff --git a/test/integration_test.cpp b/test/integration_test.cpp
index 9c7e78f..e07f444 100644
--- a/test/integration_test.cpp
+++ b/test/integration_test.cpp
@@ -39,6 +39,9 @@ class MonitoringStats {
         uint64_t expired_keys{0};
         uint64_t failed_refreshes{0};
         uint64_t stale_key_uses{0};
+        // Background refresh statistics
+        uint64_t background_successful_refreshes{0};
+        uint64_t background_failed_refreshes{0};
     };
 
     struct FailedIssuerLookup {
@@ -157,6 +160,19 @@ class MonitoringStats {
                             static_cast<uint64_t>(it->second.get<double>());
                     }
 
+                    // Background refresh statistics
+                    it = stats_obj.find("background_successful_refreshes");
+                    if (it != stats_obj.end() && it->second.is<double>()) {
+                        stats.background_successful_refreshes =
+                            static_cast<uint64_t>(it->second.get<double>());
+                    }
+
+                    it = stats_obj.find("background_failed_refreshes");
+                    if (it != stats_obj.end() && it->second.is<double>()) {
+                        stats.background_failed_refreshes =
+                            static_cast<uint64_t>(it->second.get<double>());
+                    }
+
                     issuers_[issuer_entry.first] = stats;
                 }
             }
@@ -1113,6 +1129,13 @@ TEST_F(IntegrationTest, MonitoringFileOutput) {
 TEST_F(IntegrationTest, BackgroundRefreshTest) {
     char *err_msg = nullptr;
 
+    // Reset monitoring stats to get a clean baseline
+    scitoken_reset_monitoring_stats(&err_msg);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
     // Set smaller intervals for testing (1 second refresh interval, 2 seconds
     // threshold)
     int rv =
@@ -1133,6 +1156,16 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
         err_msg = nullptr;
     }
 
+    // Set update interval to 1 second BEFORE first verification so the
+    // cache entry will have next_update just 1 second in the future.
+    // This ensures the background thread can refresh within the test window.
+    rv = scitoken_config_set_int("keycache.update_interval_s", 1, &err_msg);
+    ASSERT_EQ(rv, 0);
+    if (err_msg) {
+        free(err_msg);
+        err_msg = nullptr;
+    }
+
     // Create a key and token
     std::unique_ptr<void, decltype(&scitoken_key_destroy)> key(
         scitoken_key_create("test-key-1", "ES256", public_key_.c_str(),
@@ -1203,7 +1236,6 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
     ASSERT_EQ(rv, 0) << "Failed to get cached JWKS: "
                      << (err_msg ? err_msg : "unknown error");
     ASSERT_TRUE(jwks_before != nullptr);
-    std::unique_ptr<char, decltype(&free)> jwks_before_ptr(jwks_before, free);
     if (err_msg) {
         free(err_msg);
         err_msg = nullptr;
@@ -1211,14 +1243,30 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
 
     std::cout << "Initial JWKS fetched successfully" << std::endl;
 
-    // Set update interval to 1 second so keys will need refresh soon
-    rv = scitoken_config_set_int("keycache.update_interval_s", 1, &err_msg);
-    ASSERT_EQ(rv, 0);
+    // Re-set the JWKS to force a fresh cache entry with the current
+    // update_interval (1 second). This ensures next_update is just 1 second
+    // in the future so the background thread will refresh it.
+    rv = keycache_set_jwks(issuer_url_.c_str(), jwks_before, &err_msg);
+    ASSERT_EQ(rv, 0) << "Failed to set JWKS: "
+                     << (err_msg ? err_msg : "unknown error");
+    free(jwks_before);
     if (err_msg) {
         free(err_msg);
         err_msg = nullptr;
     }
 
+    std::cout << "JWKS re-set with 1-second update interval" << std::endl;
+
+    // Get monitoring stats before background refresh
+    auto before_stats = getCurrentMonitoringStats();
+    auto before_issuer_stats = before_stats.getIssuerStats(issuer_url_);
+    std::cout << "Before background refresh:" << std::endl;
+    std::cout << "  background_successful_refreshes: "
+              << before_issuer_stats.background_successful_refreshes
+              << std::endl;
+    std::cout << "  background_failed_refreshes: "
+              << before_issuer_stats.background_failed_refreshes << std::endl;
+
     // Enable background refresh
     rv = keycache_set_background_refresh(1, &err_msg);
     ASSERT_EQ(rv, 0) << "Failed to enable background refresh: "
@@ -1238,10 +1286,6 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
     std::cout << "Waiting 4 seconds for background refresh..." << std::endl;
     sleep(4);
 
-    // The background refresh should have occurred
-    // We can't easily verify it refreshed without instrumenting the code more,
-    // but we can verify the thread is running and didn't crash
-
     // Stop background refresh
     rv = keycache_stop_background_refresh(&err_msg);
     ASSERT_EQ(rv, 0) << "Failed to stop background refresh: "
@@ -1265,6 +1309,30 @@ TEST_F(IntegrationTest, BackgroundRefreshTest) {
         err_msg = nullptr;
     }
 
+    // Verify that background refresh statistics increased for our issuer
+    auto after_stats = getCurrentMonitoringStats();
+    auto after_issuer_stats = after_stats.getIssuerStats(issuer_url_);
+
+    std::cout << "After background refresh:" << std::endl;
+    std::cout << "  background_successful_refreshes: "
+              << after_issuer_stats.background_successful_refreshes
+              << std::endl;
+    std::cout << "  background_failed_refreshes: "
+              << after_issuer_stats.background_failed_refreshes << std::endl;
+
+    // The background thread should have performed at least one refresh
+    // for our issuer (either successful or failed)
+    uint64_t total_background_refreshes =
+        after_issuer_stats.background_successful_refreshes +
+        after_issuer_stats.background_failed_refreshes;
+    uint64_t before_total =
+        before_issuer_stats.background_successful_refreshes +
+        before_issuer_stats.background_failed_refreshes;
+
+    EXPECT_GT(total_background_refreshes, before_total)
+        << "Background refresh thread should have performed at least one "
+           "refresh attempt for our issuer";
+
     std::cout << "Test completed successfully" << std::endl;
 }
 

From 8c1603fa432cf8ac9aa144a341ba9432e657fefe Mon Sep 17 00:00:00 2001
From: Brian P Bockelman <bockelman@gmail.com>
Date: Wed, 10 Dec 2025 19:26:21 +0000
Subject: [PATCH 09/10] Use int64_t for integer statistics in JSON output

- Change MonitoringStats::get_json() to cast integer counters to int64_t
  instead of double for proper integer representation in JSON
- Update monitoring_test.cpp to parse integer fields using is<int64_t>()
  and get<int64_t>() instead of double
- Use memory_order_relaxed for atomic loads in get_json() since these
  are read-only statistics snapshots
---
 src/scitokens.cpp            | 11 +++--
 src/scitokens.h              |  8 ++++
 src/scitokens_internal.h     | 90 ++++++++++++++++++++++++------------
 src/scitokens_monitoring.cpp | 46 ++++++++++--------
 test/monitoring_test.cpp     | 44 +++++++++---------
 5 files changed, 125 insertions(+), 74 deletions(-)

diff --git a/src/scitokens.cpp b/src/scitokens.cpp
index b3c1d25..0919bcc 100644
--- a/src/scitokens.cpp
+++ b/src/scitokens.cpp
@@ -43,14 +43,17 @@ void load_config_from_environment() {
         bool is_int;
     };
 
-    const std::array<ConfigMapping, 6> known_configs = {
+    const std::array<ConfigMapping, 8> known_configs = {
         {{"keycache.update_interval_s", "KEYCACHE_UPDATE_INTERVAL_S", true},
          {"keycache.expiration_interval_s", "KEYCACHE_EXPIRATION_INTERVAL_S",
           true},
          {"keycache.cache_home", "KEYCACHE_CACHE_HOME", false},
          {"tls.ca_file", "TLS_CA_FILE", false},
          {"monitoring.file", "MONITORING_FILE", false},
-         {"monitoring.file_interval_s", "MONITORING_FILE_INTERVAL_S", true}}};
+         {"monitoring.file_interval_s", "MONITORING_FILE_INTERVAL_S", true},
+         {"keycache.refresh_interval_ms", "KEYCACHE_REFRESH_INTERVAL_MS", true},
+         {"keycache.refresh_threshold_ms", "KEYCACHE_REFRESH_THRESHOLD_MS",
+          true}}};
 
     const char *prefix = "SCITOKEN_CONFIG_";
 
@@ -130,9 +133,9 @@ int configurer::Configuration::get_monitoring_file_interval() {
 
 // Background refresh config
 std::atomic_bool configurer::Configuration::m_background_refresh_enabled{false};
-std::atomic_int configurer::Configuration::m_refresh_interval{
+std::atomic_int configurer::Configuration::m_refresh_interval_ms{
     60000}; // 60 seconds
-std::atomic_int configurer::Configuration::m_refresh_threshold{
+std::atomic_int configurer::Configuration::m_refresh_threshold_ms{
     600000}; // 10 minutes
 
 SciTokenKey scitoken_key_create(const char *key_id, const char *alg,
diff --git a/src/scitokens.h b/src/scitokens.h
index a2e8256..88dcc68 100644
--- a/src/scitokens.h
+++ b/src/scitokens.h
@@ -327,6 +327,10 @@ int config_set_int(const char *key, int value, char **err_msg);
  * - "keycache.expiration_interval_s": Key cache expiration time (seconds)
  * - "monitoring.file_interval_s": Interval between monitoring file writes
  * (seconds, default 60)
+ * - "keycache.refresh_interval_ms": Background refresh thread check interval
+ * (milliseconds, default 60000)
+ * - "keycache.refresh_threshold_ms": Time before next_update when background
+ * refresh triggers (milliseconds, default 600000)
  */
 int scitoken_config_set_int(const char *key, int value, char **err_msg);
 
@@ -344,6 +348,10 @@ int config_get_int(const char *key, char **err_msg);
  * - "keycache.expiration_interval_s": Key cache expiration time (seconds)
  * - "monitoring.file_interval_s": Interval between monitoring file writes
  * (seconds, default 60)
+ * - "keycache.refresh_interval_ms": Background refresh thread check interval
+ * (milliseconds, default 60000)
+ * - "keycache.refresh_threshold_ms": Time before next_update when background
+ * refresh triggers (milliseconds, default 600000)
  */
 int scitoken_config_get_int(const char *key, char **err_msg);
 
diff --git a/src/scitokens_internal.h b/src/scitokens_internal.h
index 9fb042c..68f2050 100644
--- a/src/scitokens_internal.h
+++ b/src/scitokens_internal.h
@@ -70,13 +70,13 @@ class Configuration {
         return m_background_refresh_enabled;
     }
     static void set_refresh_interval(int interval_ms) {
-        m_refresh_interval = interval_ms;
+        m_refresh_interval_ms = interval_ms;
     }
-    static int get_refresh_interval() { return m_refresh_interval; }
+    static int get_refresh_interval() { return m_refresh_interval_ms; }
     static void set_refresh_threshold(int threshold_ms) {
-        m_refresh_threshold = threshold_ms;
+        m_refresh_threshold_ms = threshold_ms;
     }
-    static int get_refresh_threshold() { return m_refresh_threshold; }
+    static int get_refresh_threshold() { return m_refresh_threshold_ms; }
 
   private:
     // Accessor functions for construct-on-first-use idiom
@@ -127,8 +127,8 @@ class Configuration {
     static std::atomic<bool> m_monitoring_file_configured; // Fast-path flag
     static std::atomic_int m_monitoring_file_interval; // In seconds, default 60
     static std::atomic_bool m_background_refresh_enabled;
-    static std::atomic_int m_refresh_interval;  // N milliseconds
-    static std::atomic_int m_refresh_threshold; // M milliseconds
+    static std::atomic_int m_refresh_interval_ms;  // N milliseconds
+    static std::atomic_int m_refresh_threshold_ms; // M milliseconds
     // static bool check_dir(const std::string dir_path);
     static std::pair<bool, std::string>
     mkdir_and_parents_if_needed(const std::string dir_path);
@@ -264,35 +264,59 @@ struct IssuerStats {
     std::atomic<uint64_t> background_successful_refreshes{0};
     std::atomic<uint64_t> background_failed_refreshes{0};
 
-    // Increment methods for atomic counters
-    void inc_successful_validation() { successful_validations++; }
-    void inc_unsuccessful_validation() { unsuccessful_validations++; }
-    void inc_expired_token() { expired_tokens++; }
-    void inc_sync_validation_started() { sync_validations_started++; }
-    void inc_async_validation_started() { async_validations_started++; }
-    void inc_stale_key_use() { stale_key_uses++; }
-    void inc_failed_refresh() { failed_refreshes++; }
-    void inc_expired_key() { expired_keys++; }
-    void inc_successful_key_lookup() { successful_key_lookups++; }
-    void inc_failed_key_lookup() { failed_key_lookups++; }
+    // Increment methods for atomic counters (use relaxed ordering for stats)
+    void inc_successful_validation() {
+        successful_validations.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_unsuccessful_validation() {
+        unsuccessful_validations.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_expired_token() {
+        expired_tokens.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_sync_validation_started() {
+        sync_validations_started.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_async_validation_started() {
+        async_validations_started.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_stale_key_use() {
+        stale_key_uses.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_failed_refresh() {
+        failed_refreshes.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_expired_key() {
+        expired_keys.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_successful_key_lookup() {
+        successful_key_lookups.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_failed_key_lookup() {
+        failed_key_lookups.fetch_add(1, std::memory_order_relaxed);
+    }
     void inc_background_successful_refresh() {
-        background_successful_refreshes++;
+        background_successful_refreshes.fetch_add(1, std::memory_order_relaxed);
+    }
+    void inc_background_failed_refresh() {
+        background_failed_refreshes.fetch_add(1, std::memory_order_relaxed);
     }
-    void inc_background_failed_refresh() { background_failed_refreshes++; }
 
-    // Time setters that accept std::chrono::duration
+    // Time setters that accept std::chrono::duration (use relaxed ordering)
     template <typename Rep, typename Period>
     void add_sync_time(std::chrono::duration<Rep, Period> duration) {
         auto ns =
             std::chrono::duration_cast<std::chrono::nanoseconds>(duration);
-        sync_total_time_ns += static_cast<uint64_t>(ns.count());
+        sync_total_time_ns.fetch_add(static_cast<uint64_t>(ns.count()),
+                                     std::memory_order_relaxed);
     }
 
     template <typename Rep, typename Period>
     void add_async_time(std::chrono::duration<Rep, Period> duration) {
         auto ns =
             std::chrono::duration_cast<std::chrono::nanoseconds>(duration);
-        async_total_time_ns += static_cast<uint64_t>(ns.count());
+        async_total_time_ns.fetch_add(static_cast<uint64_t>(ns.count()),
+                                      std::memory_order_relaxed);
     }
 
     template <typename Rep, typename Period>
@@ -300,21 +324,27 @@ struct IssuerStats {
     add_failed_key_lookup_time(std::chrono::duration<Rep, Period> duration) {
         auto ns =
             std::chrono::duration_cast<std::chrono::nanoseconds>(duration);
-        failed_key_lookup_time_ns += static_cast<uint64_t>(ns.count());
+        failed_key_lookup_time_ns.fetch_add(static_cast<uint64_t>(ns.count()),
+                                            std::memory_order_relaxed);
     }
 
     void inc_failed_key_lookup(std::chrono::nanoseconds duration) {
-        failed_key_lookups++;
-        failed_key_lookup_time_ns += static_cast<uint64_t>(duration.count());
+        failed_key_lookups.fetch_add(1, std::memory_order_relaxed);
+        failed_key_lookup_time_ns.fetch_add(
+            static_cast<uint64_t>(duration.count()), std::memory_order_relaxed);
     }
 
-    // Time getters that return seconds as double
+    // Time getters that return seconds as double (use relaxed ordering)
     double get_sync_time_s() const {
-        return static_cast<double>(sync_total_time_ns.load()) / 1e9;
+        return static_cast<double>(
+                   sync_total_time_ns.load(std::memory_order_relaxed)) /
+               1e9;
     }
 
     double get_async_time_s() const {
-        return static_cast<double>(async_total_time_ns.load()) / 1e9;
+        return static_cast<double>(
+                   async_total_time_ns.load(std::memory_order_relaxed)) /
+               1e9;
     }
 
     double get_total_time_s() const {
@@ -322,7 +352,9 @@ struct IssuerStats {
     }
 
     double get_failed_key_lookup_time_s() const {
-        return static_cast<double>(failed_key_lookup_time_ns.load()) / 1e9;
+        return static_cast<double>(
+                   failed_key_lookup_time_ns.load(std::memory_order_relaxed)) /
+               1e9;
     }
 };
 
diff --git a/src/scitokens_monitoring.cpp b/src/scitokens_monitoring.cpp
index 0a019c3..56c7a4e 100644
--- a/src/scitokens_monitoring.cpp
+++ b/src/scitokens_monitoring.cpp
@@ -85,17 +85,21 @@ std::string MonitoringStats::get_json() const {
 
         picojson::object issuer_obj;
         issuer_obj["successful_validations"] = picojson::value(
-            static_cast<double>(stats.successful_validations.load()));
+            static_cast<int64_t>(stats.successful_validations.load(
+                std::memory_order_relaxed)));
         issuer_obj["unsuccessful_validations"] = picojson::value(
-            static_cast<double>(stats.unsuccessful_validations.load()));
-        issuer_obj["expired_tokens"] =
-            picojson::value(static_cast<double>(stats.expired_tokens.load()));
+            static_cast<int64_t>(stats.unsuccessful_validations.load(
+                std::memory_order_relaxed)));
+        issuer_obj["expired_tokens"] = picojson::value(static_cast<int64_t>(
+            stats.expired_tokens.load(std::memory_order_relaxed)));
 
         // Validation started counters
         issuer_obj["sync_validations_started"] = picojson::value(
-            static_cast<double>(stats.sync_validations_started.load()));
+            static_cast<int64_t>(stats.sync_validations_started.load(
+                std::memory_order_relaxed)));
         issuer_obj["async_validations_started"] = picojson::value(
-            static_cast<double>(stats.async_validations_started.load()));
+            static_cast<int64_t>(stats.async_validations_started.load(
+                std::memory_order_relaxed)));
 
         // Duration tracking
         issuer_obj["sync_total_time_s"] =
@@ -107,25 +111,29 @@ std::string MonitoringStats::get_json() const {
 
         // Web lookup statistics
         issuer_obj["successful_key_lookups"] = picojson::value(
-            static_cast<double>(stats.successful_key_lookups.load()));
-        issuer_obj["failed_key_lookups"] = picojson::value(
-            static_cast<double>(stats.failed_key_lookups.load()));
+            static_cast<int64_t>(stats.successful_key_lookups.load(
+                std::memory_order_relaxed)));
+        issuer_obj["failed_key_lookups"] = picojson::value(static_cast<int64_t>(
+            stats.failed_key_lookups.load(std::memory_order_relaxed)));
         issuer_obj["failed_key_lookup_time_s"] =
             picojson::value(stats.get_failed_key_lookup_time_s());
 
         // Key refresh statistics
-        issuer_obj["expired_keys"] =
-            picojson::value(static_cast<double>(stats.expired_keys.load()));
-        issuer_obj["failed_refreshes"] =
-            picojson::value(static_cast<double>(stats.failed_refreshes.load()));
-        issuer_obj["stale_key_uses"] =
-            picojson::value(static_cast<double>(stats.stale_key_uses.load()));
+        issuer_obj["expired_keys"] = picojson::value(static_cast<int64_t>(
+            stats.expired_keys.load(std::memory_order_relaxed)));
+        issuer_obj["failed_refreshes"] = picojson::value(static_cast<int64_t>(
+            stats.failed_refreshes.load(std::memory_order_relaxed)));
+        issuer_obj["stale_key_uses"] = picojson::value(static_cast<int64_t>(
+            stats.stale_key_uses.load(std::memory_order_relaxed)));
 
         // Background refresh statistics
-        issuer_obj["background_successful_refreshes"] = picojson::value(
-            static_cast<double>(stats.background_successful_refreshes.load()));
+        issuer_obj["background_successful_refreshes"] =
+            picojson::value(static_cast<int64_t>(
+                stats.background_successful_refreshes.load(
+                    std::memory_order_relaxed)));
         issuer_obj["background_failed_refreshes"] = picojson::value(
-            static_cast<double>(stats.background_failed_refreshes.load()));
+            static_cast<int64_t>(stats.background_failed_refreshes.load(
+                std::memory_order_relaxed)));
 
         std::string sanitized_issuer = sanitize_issuer_for_json(issuer);
         issuers_obj[sanitized_issuer] = picojson::value(issuer_obj);
@@ -141,7 +149,7 @@ std::string MonitoringStats::get_json() const {
                 sanitize_issuer_for_json(entry.first);
             picojson::object lookup_stats;
             lookup_stats["count"] =
-                picojson::value(static_cast<double>(entry.second.count));
+                picojson::value(static_cast<int64_t>(entry.second.count));
             lookup_stats["total_time_s"] =
                 picojson::value(entry.second.total_time_s);
             failed_obj[sanitized_issuer] = picojson::value(lookup_stats);
diff --git a/test/monitoring_test.cpp b/test/monitoring_test.cpp
index c27c3b0..327d35b 100644
--- a/test/monitoring_test.cpp
+++ b/test/monitoring_test.cpp
@@ -77,34 +77,34 @@ class MonitoringStats {
                         issuer_entry.second.get<picojson::object>();
 
                     auto it = stats_obj.find("successful_validations");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.successful_validations =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("unsuccessful_validations");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.unsuccessful_validations =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("expired_tokens");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.expired_tokens =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     // Validation started counters
                     it = stats_obj.find("sync_validations_started");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.sync_validations_started =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("async_validations_started");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.async_validations_started =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     // Duration tracking
@@ -126,15 +126,15 @@ class MonitoringStats {
 
                     // Key lookup statistics
                     it = stats_obj.find("successful_key_lookups");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.successful_key_lookups =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("failed_key_lookups");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.failed_key_lookups =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("failed_key_lookup_time_s");
@@ -145,21 +145,21 @@ class MonitoringStats {
 
                     // Key refresh statistics
                     it = stats_obj.find("expired_keys");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.expired_keys =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("failed_refreshes");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.failed_refreshes =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = stats_obj.find("stale_key_uses");
-                    if (it != stats_obj.end() && it->second.is<double>()) {
+                    if (it != stats_obj.end() && it->second.is<int64_t>()) {
                         stats.stale_key_uses =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     issuers_[issuer_entry.first] = stats;
@@ -179,9 +179,9 @@ class MonitoringStats {
                     auto &lookup_obj = entry.second.get<picojson::object>();
 
                     auto it = lookup_obj.find("count");
-                    if (it != lookup_obj.end() && it->second.is<double>()) {
+                    if (it != lookup_obj.end() && it->second.is<int64_t>()) {
                         lookup.count =
-                            static_cast<uint64_t>(it->second.get<double>());
+                            static_cast<uint64_t>(it->second.get<int64_t>());
                     }
 
                     it = lookup_obj.find("total_time_s");

From 1b2c830688423433699e63f0221921b759571c39 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Wed, 10 Dec 2025 19:33:42 +0000
Subject: [PATCH 10/10] Fix clang-format issues in scitokens_monitoring.cpp

- Apply clang-format to fix line wrapping in monitoring statistics code
- Adjust formatting for long picojson::value() calls
- All files now pass clang-format --Werror check

Co-authored-by: bbockelm <1093447+bbockelm@users.noreply.github.com>
---
 src/scitokens_monitoring.cpp | 19 +++++++++----------
 1 file changed, 9 insertions(+), 10 deletions(-)

diff --git a/src/scitokens_monitoring.cpp b/src/scitokens_monitoring.cpp
index 56c7a4e..ad7216f 100644
--- a/src/scitokens_monitoring.cpp
+++ b/src/scitokens_monitoring.cpp
@@ -84,9 +84,9 @@ std::string MonitoringStats::get_json() const {
         const IssuerStats &stats = entry.second;
 
         picojson::object issuer_obj;
-        issuer_obj["successful_validations"] = picojson::value(
-            static_cast<int64_t>(stats.successful_validations.load(
-                std::memory_order_relaxed)));
+        issuer_obj["successful_validations"] =
+            picojson::value(static_cast<int64_t>(
+                stats.successful_validations.load(std::memory_order_relaxed)));
         issuer_obj["unsuccessful_validations"] = picojson::value(
             static_cast<int64_t>(stats.unsuccessful_validations.load(
                 std::memory_order_relaxed)));
@@ -110,9 +110,9 @@ std::string MonitoringStats::get_json() const {
             picojson::value(stats.get_total_time_s());
 
         // Web lookup statistics
-        issuer_obj["successful_key_lookups"] = picojson::value(
-            static_cast<int64_t>(stats.successful_key_lookups.load(
-                std::memory_order_relaxed)));
+        issuer_obj["successful_key_lookups"] =
+            picojson::value(static_cast<int64_t>(
+                stats.successful_key_lookups.load(std::memory_order_relaxed)));
         issuer_obj["failed_key_lookups"] = picojson::value(static_cast<int64_t>(
             stats.failed_key_lookups.load(std::memory_order_relaxed)));
         issuer_obj["failed_key_lookup_time_s"] =
@@ -127,10 +127,9 @@ std::string MonitoringStats::get_json() const {
             stats.stale_key_uses.load(std::memory_order_relaxed)));
 
         // Background refresh statistics
-        issuer_obj["background_successful_refreshes"] =
-            picojson::value(static_cast<int64_t>(
-                stats.background_successful_refreshes.load(
-                    std::memory_order_relaxed)));
+        issuer_obj["background_successful_refreshes"] = picojson::value(
+            static_cast<int64_t>(stats.background_successful_refreshes.load(
+                std::memory_order_relaxed)));
         issuer_obj["background_failed_refreshes"] = picojson::value(
             static_cast<int64_t>(stats.background_failed_refreshes.load(
                 std::memory_order_relaxed)));