diff --git a/controllers/llamaCPP.h b/controllers/llamaCPP.h index c1017c757..b7b2b27b0 100644 --- a/controllers/llamaCPP.h +++ b/controllers/llamaCPP.h @@ -1537,6 +1537,7 @@ struct llama_server_context { "cache\n"); kv_cache_clear(); } + std::this_thread::sleep_for(std::chrono::milliseconds(5)); // TODO: Need to implement queueing using CV for better performance // std::unique_lock lock(mutex_tasks); // condition_tasks.wait(lock, [&] { return !queue_tasks.empty(); });