thread_system/autoscaler_8cpp_source.html

// BSD 3-Clause License

// Copyright (c) 2024, 🍀☀🌕🌥 🌊

// See the LICENSE file in the project root for full license information.


#include <kcenon/thread/scaling/autoscaler.h>

#include <kcenon/thread/core/thread_pool.h>

#include <kcenon/thread/core/thread_worker.h>

#include <kcenon/thread/utils/formatter.h>


#include <algorithm>

#include <numeric>


namespace kcenon::thread

{


autoscaler::autoscaler(thread_pool& pool, autoscaling_policy policy)

    : pool_(pool)

    , policy_(std::move(policy))

    , last_sample_time_(std::chrono::steady_clock::now())

{

    // Initialize stats with current worker count

    std::scoped_lock<std::mutex> lock(stats_mutex_);

    stats_.min_workers = pool_.get_active_worker_count();

    stats_.peak_workers = stats_.min_workers;

}


autoscaler::~autoscaler()

{

    stop();

}


auto autoscaler::start() -> void

{

    bool expected = false;

    if (!running_.compare_exchange_strong(expected, true))

    {

        // Already running

        return;

    }


    // Start monitor thread

    monitor_thread_ = std::make_unique<std::thread>([this]() {

        monitor_loop();

    });

}


auto autoscaler::stop() -> void

{

    bool expected = true;

    if (!running_.compare_exchange_strong(expected, false))

    {

        // Already stopped

        return;

    }


    // Wake up monitor thread

    {

        std::lock_guard<std::mutex> lock(mutex_);

        cv_.notify_one();

    }


    // Wait for thread to complete

    if (monitor_thread_ && monitor_thread_->joinable())

    {

        monitor_thread_->join();

    }

    monitor_thread_.reset();

}


auto autoscaler::is_active() const -> bool

{

    return running_.load(std::memory_order_acquire);

}


auto autoscaler::evaluate_now() -> scaling_decision

{

    // Collect current metrics

    auto sample = collect_metrics();


    // Add to history

    {

        std::scoped_lock<std::mutex> lock(history_mutex_);

        metrics_history_.push_back(sample);

        if (metrics_history_.size() > 60)

        {

            metrics_history_.pop_front();

        }

    }


    // Get recent samples for decision

    std::vector<scaling_metrics_sample> samples;

    {

        std::scoped_lock<std::mutex> lock(history_mutex_);

        std::size_t count = std::min(metrics_history_.size(), policy_.samples_for_decision);

        samples.reserve(count);

        auto it = metrics_history_.end();

        std::advance(it, -static_cast<std::ptrdiff_t>(count));

        for (; it != metrics_history_.end(); ++it)

        {

            samples.push_back(*it);

        }

    }


    // Make decision

    return make_decision(samples);

}


auto autoscaler::scale_to(std::size_t target_workers) -> common::VoidResult

{

    // Clamp to policy bounds

    target_workers = std::clamp(target_workers, policy_.min_workers, policy_.max_workers);


    std::size_t current_workers = pool_.get_active_worker_count();


    if (target_workers > current_workers)

    {

        return add_workers(target_workers - current_workers);

    }

    else if (target_workers < current_workers)

    {

        return remove_workers(current_workers - target_workers);

    }


    return common::ok();

}


auto autoscaler::scale_up() -> common::VoidResult

{

    std::size_t current = pool_.get_active_worker_count();

    std::size_t increment = policy_.use_multiplicative_scaling

        ? static_cast<std::size_t>(current * (policy_.scale_up_factor - 1.0))

        : policy_.scale_up_increment;


    if (increment == 0)

    {

        increment = 1;

    }


    std::size_t target = std::min(current + increment, policy_.max_workers);

    return scale_to(target);

}


auto autoscaler::scale_down() -> common::VoidResult

{

    std::size_t current = pool_.get_active_worker_count();

    std::size_t target = current > policy_.scale_down_increment

        ? current - policy_.scale_down_increment

        : policy_.min_workers;


    target = std::max(target, policy_.min_workers);

    return scale_to(target);

}


auto autoscaler::set_policy(autoscaling_policy policy) -> void

{

    std::scoped_lock<std::mutex> lock(mutex_);

    policy_ = std::move(policy);

}


auto autoscaler::get_policy() const -> const autoscaling_policy&

{

    return policy_;

}


auto autoscaler::get_current_metrics() const -> scaling_metrics_sample

{

    return collect_metrics();

}


auto autoscaler::get_metrics_history(std::size_t count) const

    -> std::vector<scaling_metrics_sample>

{

    std::scoped_lock<std::mutex> lock(history_mutex_);


    std::vector<scaling_metrics_sample> result;

    std::size_t actual_count = std::min(count, metrics_history_.size());

    result.reserve(actual_count);


    auto it = metrics_history_.end();

    std::advance(it, -static_cast<std::ptrdiff_t>(actual_count));

    for (; it != metrics_history_.end(); ++it)

    {

        result.push_back(*it);

    }


    return result;

}


auto autoscaler::get_stats() const -> autoscaling_stats

{

    std::scoped_lock<std::mutex> lock(stats_mutex_);

    return stats_;

}


auto autoscaler::reset_stats() -> void

{

    std::scoped_lock<std::mutex> lock(stats_mutex_);

    stats_ = autoscaling_stats{};

    stats_.min_workers = pool_.get_active_worker_count();

    stats_.peak_workers = stats_.min_workers;

}


auto autoscaler::monitor_loop() -> void

{

    while (running_.load(std::memory_order_acquire))

    {

        // Wait for sample interval

        {

            std::unique_lock<std::mutex> lock(mutex_);

            cv_.wait_for(lock, policy_.sample_interval, [this]() {

                return !running_.load(std::memory_order_acquire);

            });

        }


        if (!running_.load(std::memory_order_acquire))

        {

            break;

        }


        // Skip if pool is not running

        if (!pool_.is_running())

        {

            continue;

        }


        // Collect metrics

        auto sample = collect_metrics();


        // Add to history

        {

            std::scoped_lock<std::mutex> lock(history_mutex_);

            metrics_history_.push_back(sample);


            // Keep max 60 samples (1 minute at 1s interval)

            while (metrics_history_.size() > 60)

            {

                metrics_history_.pop_front();

            }

        }


        // Only auto-scale in automatic mode

        if (policy_.scaling_mode != autoscaling_policy::mode::automatic)

        {

            continue;

        }


        // Collect samples for decision

        std::vector<scaling_metrics_sample> samples;

        {

            std::scoped_lock<std::mutex> lock(history_mutex_);

            std::size_t count = std::min(metrics_history_.size(), policy_.samples_for_decision);

            if (count < policy_.samples_for_decision)

            {

                // Not enough samples yet

                continue;

            }


            samples.reserve(count);

            auto it = metrics_history_.end();

            std::advance(it, -static_cast<std::ptrdiff_t>(count));

            for (; it != metrics_history_.end(); ++it)

            {

                samples.push_back(*it);

            }

        }


        // Make and execute decision

        auto decision = make_decision(samples);

        if (decision.should_scale())

        {

            execute_scaling(decision);

        }


        // Update stats

        {

            std::scoped_lock<std::mutex> lock(stats_mutex_);

            ++stats_.decisions_evaluated;


            std::size_t current = pool_.get_active_worker_count();

            stats_.peak_workers = std::max(stats_.peak_workers, current);

            if (stats_.min_workers == 0 || current < stats_.min_workers)

            {

                stats_.min_workers = current;

            }

        }

    }

}


auto autoscaler::collect_metrics() const -> scaling_metrics_sample

{

    auto now = std::chrono::steady_clock::now();


    scaling_metrics_sample sample;

    sample.timestamp = now;

    sample.worker_count = pool_.get_active_worker_count();

    sample.active_workers = sample.worker_count - pool_.get_idle_worker_count();

    sample.queue_depth = pool_.get_pending_task_count();


    // Calculate utilization

    if (sample.worker_count > 0)

    {

        sample.utilization = static_cast<double>(sample.active_workers) /

            static_cast<double>(sample.worker_count);

        sample.queue_depth_per_worker = static_cast<double>(sample.queue_depth) /

            static_cast<double>(sample.worker_count);

    }


    // Get metrics from pool

    auto metrics_snapshot = pool_.metrics().snapshot();

    sample.jobs_completed = metrics_snapshot.tasks_executed;

    sample.jobs_submitted = metrics_snapshot.tasks_submitted;


    // Calculate throughput if we have a previous sample

    auto duration = std::chrono::duration_cast<std::chrono::milliseconds>(

        now - last_sample_time_).count();

    if (duration > 0 && sample.jobs_completed >= last_jobs_completed_)

    {

        std::uint64_t jobs_delta = sample.jobs_completed - last_jobs_completed_;

        sample.throughput_per_second = static_cast<double>(jobs_delta) * 1000.0 /

            static_cast<double>(duration);

    }


    // Get P95 latency from enhanced metrics if available

    // Note: Using P99 wait time as closest approximation to P95

    if (pool_.is_enhanced_metrics_enabled())

    {

        auto enhanced_snapshot = pool_.enhanced_metrics_snapshot();

        // Convert from microseconds to milliseconds

        sample.p95_latency_ms = enhanced_snapshot.wait_time_p99_us / 1000.0;

    }


    // Update cached values for next sample

    const_cast<autoscaler*>(this)->last_jobs_completed_ = sample.jobs_completed;

    const_cast<autoscaler*>(this)->last_jobs_submitted_ = sample.jobs_submitted;

    const_cast<autoscaler*>(this)->last_sample_time_ = now;


    return sample;

}


auto autoscaler::make_decision(const std::vector<scaling_metrics_sample>& samples) const

    -> scaling_decision

{

    if (samples.empty())

    {

        return scaling_decision{};

    }


    // Calculate average metrics from samples

    double avg_utilization = 0.0;

    double avg_queue_depth_per_worker = 0.0;

    double avg_latency = 0.0;

    std::size_t avg_queue_depth = 0;


    for (const auto& sample : samples)

    {

        avg_utilization += sample.utilization;

        avg_queue_depth_per_worker += sample.queue_depth_per_worker;

        avg_latency += sample.p95_latency_ms;

        avg_queue_depth += sample.queue_depth;

    }


    auto sample_count = static_cast<double>(samples.size());

    avg_utilization /= sample_count;

    avg_queue_depth_per_worker /= sample_count;

    avg_latency /= sample_count;

    avg_queue_depth /= samples.size();


    std::size_t current_workers = pool_.get_active_worker_count();


    // Check scale-up triggers (ANY trigger)

    if (can_scale_up())

    {

        if (avg_utilization > policy_.scale_up.utilization_threshold)

        {

            std::size_t target = std::min(

                current_workers + policy_.scale_up_increment,

                policy_.max_workers);


            return scaling_decision{

                .direction = scaling_direction::up,

                .reason = scaling_reason::worker_utilization,

                .target_workers = target,

                .explanation = utility_module::formatter::format(

                    "Utilization {:.1f}% exceeds threshold {:.1f}%",

                    avg_utilization * 100, policy_.scale_up.utilization_threshold * 100)

            };

        }


        if (avg_queue_depth_per_worker > policy_.scale_up.queue_depth_threshold)

        {

            std::size_t target = std::min(

                current_workers + policy_.scale_up_increment,

                policy_.max_workers);


            return scaling_decision{

                .direction = scaling_direction::up,

                .reason = scaling_reason::queue_depth,

                .target_workers = target,

                .explanation = utility_module::formatter::format(

                    "Queue depth per worker {:.1f} exceeds threshold {:.1f}",

                    avg_queue_depth_per_worker, policy_.scale_up.queue_depth_threshold)

            };

        }


        if (avg_latency > policy_.scale_up.latency_threshold_ms && avg_latency > 0)

        {

            std::size_t target = std::min(

                current_workers + policy_.scale_up_increment,

                policy_.max_workers);


            return scaling_decision{

                .direction = scaling_direction::up,

                .reason = scaling_reason::latency,

                .target_workers = target,

                .explanation = utility_module::formatter::format(

                    "P95 latency {:.1f}ms exceeds threshold {:.1f}ms",

                    avg_latency, policy_.scale_up.latency_threshold_ms)

            };

        }


        if (avg_queue_depth > policy_.scale_up.pending_jobs_threshold)

        {

            std::size_t target = std::min(

                current_workers + policy_.scale_up_increment,

                policy_.max_workers);


            return scaling_decision{

                .direction = scaling_direction::up,

                .reason = scaling_reason::queue_depth,

                .target_workers = target,

                .explanation = utility_module::formatter::format(

                    "Queue depth {} exceeds threshold {}",

                    avg_queue_depth, policy_.scale_up.pending_jobs_threshold)

            };

        }

    }


    // Check scale-down triggers (ALL triggers)

    if (can_scale_down() && current_workers > policy_.min_workers)

    {

        bool utilization_ok = avg_utilization < policy_.scale_down.utilization_threshold;

        bool queue_depth_ok = avg_queue_depth_per_worker < policy_.scale_down.queue_depth_threshold;


        if (utilization_ok && queue_depth_ok)

        {

            std::size_t target = std::max(

                current_workers - policy_.scale_down_increment,

                policy_.min_workers);


            return scaling_decision{

                .direction = scaling_direction::down,

                .reason = scaling_reason::worker_utilization,

                .target_workers = target,

                .explanation = utility_module::formatter::format(

                    "Utilization {:.1f}% below threshold {:.1f}%, queue depth {:.1f} below {:.1f}",

                    avg_utilization * 100, policy_.scale_down.utilization_threshold * 100,

                    avg_queue_depth_per_worker, policy_.scale_down.queue_depth_threshold)

            };

        }

    }


    return scaling_decision{};

}


auto autoscaler::execute_scaling(const scaling_decision& decision) -> void

{

    std::size_t current_workers = pool_.get_active_worker_count();

    auto now = std::chrono::steady_clock::now();


    if (decision.direction == scaling_direction::up)

    {

        auto result = add_workers(decision.target_workers - current_workers);

        if (result.is_ok())

        {

            last_scale_up_time_ = now;


            std::scoped_lock<std::mutex> lock(stats_mutex_);

            ++stats_.scale_up_count;

            stats_.last_scale_up = now;


            if (policy_.scaling_callback)

            {

                policy_.scaling_callback(

                    scaling_direction::up,

                    decision.reason,

                    current_workers,

                    decision.target_workers);

            }

        }

    }

    else if (decision.direction == scaling_direction::down)

    {

        auto result = remove_workers(current_workers - decision.target_workers);

        if (result.is_ok())

        {

            last_scale_down_time_ = now;


            std::scoped_lock<std::mutex> lock(stats_mutex_);

            ++stats_.scale_down_count;

            stats_.last_scale_down = now;


            if (policy_.scaling_callback)

            {

                policy_.scaling_callback(

                    scaling_direction::down,

                    decision.reason,

                    current_workers,

                    decision.target_workers);

            }

        }

    }

}


auto autoscaler::can_scale_up() const -> bool

{

    if (pool_.get_active_worker_count() >= policy_.max_workers)

    {

        return false;

    }


    auto now = std::chrono::steady_clock::now();

    auto since_last = std::chrono::duration_cast<std::chrono::seconds>(

        now - last_scale_up_time_);


    return since_last >= policy_.scale_up_cooldown;

}


auto autoscaler::can_scale_down() const -> bool

{

    if (pool_.get_active_worker_count() <= policy_.min_workers)

    {

        return false;

    }


    auto now = std::chrono::steady_clock::now();

    auto since_last = std::chrono::duration_cast<std::chrono::seconds>(

        now - last_scale_down_time_);


    return since_last >= policy_.scale_down_cooldown;

}


auto autoscaler::add_workers(std::size_t count) -> common::VoidResult

{

    if (count == 0)

    {

        return common::ok();

    }


    // Get current context from pool

    const auto& context = pool_.get_context();


    for (std::size_t i = 0; i < count; ++i)

    {

        auto worker = std::make_unique<thread_worker>(true, context);

        auto result = pool_.enqueue(std::move(worker));

        if (result.is_err())

        {

            return result;

        }

    }


    return common::ok();

}


auto autoscaler::remove_workers(std::size_t count) -> common::VoidResult

{

    if (count == 0)

    {

        return common::ok();

    }


    // Request pool to remove workers using internal method

    // This will gracefully stop idle workers

    auto result = pool_.remove_workers_internal(count, policy_.min_workers);

    return result;

}


} // namespace kcenon::thread

autoscaler.h
Automatic scaling of thread pool workers based on load metrics.

kcenon::thread::autoscaler
Manages automatic scaling of thread pool workers based on load metrics.
Definition autoscaler.h:95

kcenon::thread::autoscaler::collect_metrics
auto collect_metrics() const -> scaling_metrics_sample
Collects current metrics from the pool.
Definition autoscaler.cpp:289

kcenon::thread::autoscaler::can_scale_down
auto can_scale_down() const -> bool
Checks if scale-down cooldown has elapsed.
Definition autoscaler.cpp:528

kcenon::thread::autoscaler::scale_to
auto scale_to(std::size_t target_workers) -> common::VoidResult
Manually scales to a specific worker count.
Definition autoscaler.cpp:108

kcenon::thread::autoscaler::last_jobs_submitted_
std::uint64_t last_jobs_submitted_
Definition autoscaler.h:291

kcenon::thread::autoscaler::running_
std::atomic< bool > running_
Definition autoscaler.h:274

kcenon::thread::autoscaler::last_sample_time_
std::chrono::steady_clock::time_point last_sample_time_
Definition autoscaler.h:292

kcenon::thread::autoscaler::is_active
auto is_active() const -> bool
Checks if the autoscaler is currently active.
Definition autoscaler.cpp:70

kcenon::thread::autoscaler::make_decision
auto make_decision(const std::vector< scaling_metrics_sample > &samples) const -> scaling_decision
Makes a scaling decision based on recent samples.
Definition autoscaler.cpp:340

kcenon::thread::autoscaler::pool_
thread_pool & pool_
Definition autoscaler.h:271

kcenon::thread::autoscaler::get_stats
auto get_stats() const -> autoscaling_stats
Gets autoscaling statistics.
Definition autoscaler.cpp:189

kcenon::thread::autoscaler::scale_up
auto scale_up() -> common::VoidResult
Manually scales up by the configured increment.
Definition autoscaler.cpp:127

kcenon::thread::autoscaler::policy_
autoscaling_policy policy_
Definition autoscaler.h:272

kcenon::thread::autoscaler::get_metrics_history
auto get_metrics_history(std::size_t count=60) const -> std::vector< scaling_metrics_sample >
Gets historical metrics samples.
Definition autoscaler.cpp:170

kcenon::thread::autoscaler::execute_scaling
auto execute_scaling(const scaling_decision &decision) -> void
Executes a scaling decision.
Definition autoscaler.cpp:465

kcenon::thread::autoscaler::evaluate_now
auto evaluate_now() -> scaling_decision
Manually triggers a scaling evaluation.
Definition autoscaler.cpp:75

kcenon::thread::autoscaler::last_scale_down_time_
std::chrono::steady_clock::time_point last_scale_down_time_
Definition autoscaler.h:284

kcenon::thread::autoscaler::stats_
autoscaling_stats stats_
Definition autoscaler.h:286

kcenon::thread::autoscaler::start
auto start() -> void
Starts the autoscaling monitor thread.
Definition autoscaler.cpp:32

kcenon::thread::autoscaler::stop
auto stop() -> void
Stops the autoscaling monitor thread.
Definition autoscaler.cpp:47

kcenon::thread::autoscaler::~autoscaler
~autoscaler()
Destructor. Stops the monitor thread if running.
Definition autoscaler.cpp:27

kcenon::thread::autoscaler::scale_down
auto scale_down() -> common::VoidResult
Manually scales down by the configured increment.
Definition autoscaler.cpp:143

kcenon::thread::autoscaler::last_jobs_completed_
std::uint64_t last_jobs_completed_
Definition autoscaler.h:290

kcenon::thread::autoscaler::reset_stats
auto reset_stats() -> void
Resets autoscaling statistics.
Definition autoscaler.cpp:195

kcenon::thread::autoscaler::get_current_metrics
auto get_current_metrics() const -> scaling_metrics_sample
Collects current metrics from the thread pool.
Definition autoscaler.cpp:165

kcenon::thread::autoscaler::can_scale_up
auto can_scale_up() const -> bool
Checks if scale-up cooldown has elapsed.
Definition autoscaler.cpp:514

kcenon::thread::autoscaler::get_policy
auto get_policy() const -> const autoscaling_policy &
Gets the current autoscaling policy.
Definition autoscaler.cpp:160

kcenon::thread::autoscaler::stats_mutex_
std::mutex stats_mutex_
Definition autoscaler.h:287

kcenon::thread::autoscaler::add_workers
auto add_workers(std::size_t count) -> common::VoidResult
Adds workers to the pool.
Definition autoscaler.cpp:542

kcenon::thread::autoscaler::autoscaler
autoscaler(thread_pool &pool, autoscaling_policy policy={})
Constructs an autoscaler for the given thread pool.
Definition autoscaler.cpp:16

kcenon::thread::autoscaler::remove_workers
auto remove_workers(std::size_t count) -> common::VoidResult
Removes workers from the pool.
Definition autoscaler.cpp:565

kcenon::thread::autoscaler::set_policy
auto set_policy(autoscaling_policy policy) -> void
Updates the autoscaling policy.
Definition autoscaler.cpp:154

kcenon::thread::autoscaler::last_scale_up_time_
std::chrono::steady_clock::time_point last_scale_up_time_
Definition autoscaler.h:283

kcenon::thread::autoscaler::monitor_loop
auto monitor_loop() -> void
Main monitoring loop running in the background thread.
Definition autoscaler.cpp:203

kcenon::thread::metrics::ThreadPoolMetrics::snapshot
Snapshot snapshot() const
Get a snapshot of all metrics.
Definition thread_pool_metrics.h:105

kcenon::thread::result
A template class representing either a value or an error.
Definition error_handling.h:252

kcenon::thread::result::is_ok
bool is_ok() const noexcept
Checks if the result is successful.
Definition error_handling.h:290

kcenon::thread::thread_pool
A thread pool for concurrent execution of jobs using multiple worker threads.
Definition thread_pool.h:182

kcenon::thread::thread_pool::is_enhanced_metrics_enabled
bool is_enhanced_metrics_enabled() const
Check if enhanced metrics is enabled.
Definition thread_pool.cpp:290

kcenon::thread::thread_pool::get_pending_task_count
auto get_pending_task_count() const -> std::size_t
Get the number of pending tasks in the queue.
Definition thread_pool.cpp:695

kcenon::thread::thread_pool::enhanced_metrics_snapshot
metrics::EnhancedSnapshot enhanced_metrics_snapshot() const
Get enhanced metrics snapshot.
Definition thread_pool.cpp:298

kcenon::thread::thread_pool::get_idle_worker_count
std::size_t get_idle_worker_count() const
Get the number of idle workers.
Definition thread_pool.cpp:679

kcenon::thread::thread_pool::get_active_worker_count
auto get_active_worker_count() const -> std::size_t
Get the current number of active (running) workers.
Definition thread_pool.cpp:755

kcenon::thread::thread_pool::metrics
const metrics::ThreadPoolMetrics & metrics() const noexcept
Access aggregated runtime metrics (read-only reference).
Definition thread_pool.cpp:273

utility_module::formatter::format
static auto format(const char *formats, const FormatArgs &... args) -> std::string
Formats a narrow-character string with the given arguments.
Definition formatter.h:129

thread_pool.h
Core thread pool implementation with work stealing and auto-scaling.

formatter.h
Generic formatter for enum types using user-provided converter functors.

kcenon::thread
Core threading foundation of the thread system library.
Definition thread_impl.h:17

kcenon::thread::scaling_direction::up
@ up
Scale up (add workers)

kcenon::thread::scaling_direction::down
@ down
Scale down (remove workers)

kcenon::thread::scaling_reason::latency
@ latency
Latency threshold exceeded.

kcenon::thread::scaling_reason::worker_utilization
@ worker_utilization
Worker utilization threshold exceeded.

kcenon::thread::scaling_reason::queue_depth
@ queue_depth
Queue depth threshold exceeded.

std
STL namespace.

kcenon::thread::autoscaling_policy
Configuration for autoscaling behavior.
Definition autoscaling_policy.h:52

kcenon::thread::autoscaling_policy::scale_down_cooldown
std::chrono::seconds scale_down_cooldown
Minimum time between scale-down events.
Definition autoscaling_policy.h:144

kcenon::thread::autoscaling_policy::mode::automatic
@ automatic
Fully automatic scaling.

kcenon::thread::autoscaling_policy::scale_up_cooldown
std::chrono::seconds scale_up_cooldown
Minimum time between scale-up events.
Definition autoscaling_policy.h:141

kcenon::thread::autoscaling_policy::min_workers
std::size_t min_workers
Minimum number of workers (never scale below this)
Definition autoscaling_policy.h:105

kcenon::thread::autoscaling_policy::max_workers
std::size_t max_workers
Maximum number of workers (never scale above this)
Definition autoscaling_policy.h:108

kcenon::thread::autoscaling_stats
Statistics for autoscaling operations.
Definition scaling_metrics.h:121

kcenon::thread::autoscaling_stats::peak_workers
std::size_t peak_workers
Peak worker count observed.
Definition scaling_metrics.h:138

kcenon::thread::autoscaling_stats::min_workers
std::size_t min_workers
Minimum worker count observed.
Definition scaling_metrics.h:141

kcenon::thread::scaling_decision
Scaling decision result.
Definition scaling_metrics.h:91

kcenon::thread::scaling_metrics_sample
Metrics sample for autoscaling decisions.
Definition scaling_metrics.h:52

kcenon::thread::scaling_metrics_sample::jobs_submitted
std::uint64_t jobs_submitted
Jobs submitted since last sample.
Definition scaling_metrics.h:78

kcenon::thread::scaling_metrics_sample::worker_count
std::size_t worker_count
Current number of workers in the pool.
Definition scaling_metrics.h:57

kcenon::thread::scaling_metrics_sample::timestamp
std::chrono::steady_clock::time_point timestamp
Timestamp when this sample was collected.
Definition scaling_metrics.h:54

kcenon::thread::scaling_metrics_sample::queue_depth_per_worker
double queue_depth_per_worker
Jobs per worker ratio.
Definition scaling_metrics.h:69

kcenon::thread::scaling_metrics_sample::jobs_completed
std::uint64_t jobs_completed
Jobs completed since last sample.
Definition scaling_metrics.h:75

kcenon::thread::scaling_metrics_sample::queue_depth
std::size_t queue_depth
Number of jobs waiting in the queue.
Definition scaling_metrics.h:63

kcenon::thread::scaling_metrics_sample::p95_latency_ms
double p95_latency_ms
P95 latency in milliseconds.
Definition scaling_metrics.h:72

kcenon::thread::scaling_metrics_sample::throughput_per_second
double throughput_per_second
Throughput in jobs per second.
Definition scaling_metrics.h:81

kcenon::thread::scaling_metrics_sample::active_workers
std::size_t active_workers
Number of workers currently processing jobs.
Definition scaling_metrics.h:60

kcenon::thread::scaling_metrics_sample::utilization
double utilization
Worker utilization ratio (0.0 - 1.0)
Definition scaling_metrics.h:66

thread_worker.h
Specialized worker thread that processes jobs from a job_queue.