13#if defined(_MSC_VER) && (defined(_M_IX86) || defined(_M_X64))
14 #include <emmintrin.h>
72 worker_id_(next_worker_id_.fetch_add(1)),
73 use_time_tag_(use_time_tag),
116 std::shared_ptr<kcenon::thread::job_queue> old_queue;
119 std::unique_lock<std::mutex> lock(queue_mutex_);
122 queue_being_replaced_ =
true;
126 queue_cv_.wait(lock, [
this] {
127 return current_job_.load(std::memory_order_acquire) ==
nullptr;
131 old_queue = job_queue_;
137 queue_being_replaced_ =
false;
140 queue_cv_.notify_all();
190 local_deque_ = std::make_unique<lockfree::work_stealing_deque<job*>>();
215 if (local_result.has_value())
217 return std::unique_ptr<job>(*local_result);
228 auto dequeue_result =
job_queue_->try_dequeue();
229 if (dequeue_result.is_ok())
231 return std::move(dequeue_result.value());
248 if (stolen !=
nullptr)
250 return std::unique_ptr<job>(stolen);
257 std::this_thread::sleep_for(backoff);
386 std::unique_lock<std::mutex> lock(queue_mutex_);
389 if (job_queue_ ==
nullptr)
398 std::shared_ptr<job_queue> local_queue = job_queue_;
403 std::unique_ptr<job> current_job;
406 if (policy_.enable_work_stealing)
411 auto local_result = local_deque_->pop();
412 if (local_result.has_value())
414 current_job = std::unique_ptr<job>(*local_result);
421 auto dequeue_result = local_queue->try_dequeue();
422 if (dequeue_result.is_ok())
424 current_job = std::move(dequeue_result.value());
431 current_job = try_steal_work();
437 is_idle_.store(
true, std::memory_order_relaxed);
438 std::this_thread::sleep_for(policy_.idle_sleep_duration);
453 constexpr int spin_count = 16;
454 for (
int i = 0; i < spin_count; ++i)
456 auto dequeue_result = local_queue->try_dequeue();
457 if (dequeue_result.is_ok())
460 current_job = std::move(dequeue_result.value());
466 #if defined(_MSC_VER)
468 #if defined(_M_IX86) || defined(_M_X64)
470 #elif defined(_M_ARM) || defined(_M_ARM64)
473 std::this_thread::yield();
475 #elif defined(__GNUC__) || defined(__clang__)
477 #if defined(__x86_64__) || defined(__i386__)
478 __builtin_ia32_pause();
479 #elif defined(__aarch64__) || defined(__arm__)
480 __asm__ __volatile__(
"yield");
482 std::this_thread::yield();
485 std::this_thread::yield();
495 is_idle_.store(
true, std::memory_order_relaxed);
499 auto dequeue_result = local_queue->dequeue();
500 if (dequeue_result.is_ok())
502 current_job = std::move(dequeue_result.value());
514 if (current_job ==
nullptr)
516 return common::error_info{
static_cast<int>(
error_code::job_invalid),
"error executing job: nullptr",
"thread_system"};
520 const auto job_id = current_job->get_job_id();
521 const auto job_name_for_event = current_job->get_name();
522 const auto enqueue_time = current_job->get_enqueue_time();
527 const bool should_trace = diagnostics_
528 && diagnostics_->is_tracing_enabled()
529 && (++diagnostics_counter_ % diagnostics_sample_rate_ == 0);
536 dequeued_event.
job_name = job_name_for_event;
538 dequeued_event.
timestamp = std::chrono::steady_clock::now();
540 dequeued_event.
thread_id = std::this_thread::get_id();
542 dequeued_event.
wait_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
543 dequeued_event.
timestamp - enqueue_time);
544 diagnostics_->record_event(dequeued_event);
548 auto now = std::chrono::steady_clock::now();
549 auto state_since = get_state_since();
550 if (is_idle_.load(std::memory_order_relaxed))
552 auto idle_duration = std::chrono::duration_cast<std::chrono::nanoseconds>(now - state_since);
553 total_idle_time_ns_.fetch_add(
554 static_cast<std::uint64_t
>(idle_duration.count()),
555 std::memory_order_relaxed
560 is_idle_.store(
false, std::memory_order_relaxed);
561 state_since_rep_.store(now.time_since_epoch().count(), std::memory_order_release);
562 current_job_start_time_ = now;
565 std::optional<std::chrono::time_point<std::chrono::high_resolution_clock>>
566 started_time_point = std::nullopt;
569 started_time_point = std::chrono::high_resolution_clock::now();
574 current_job->set_job_queue(local_queue);
578 current_job->set_cancellation_token(worker_cancellation_token_);
582 current_job_.store(current_job.get(), std::memory_order_release);
589 started_event.
job_name = job_name_for_event;
591 started_event.
timestamp = std::chrono::steady_clock::now();
593 started_event.
thread_id = std::this_thread::get_id();
595 started_event.
wait_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
597 diagnostics_->record_event(started_event);
601 auto work_result = current_job->do_work();
602 std::uint64_t execution_duration_ns = 0;
603 if (started_time_point.has_value())
605 auto end_time = std::chrono::high_resolution_clock::now();
606 execution_duration_ns =
static_cast<std::uint64_t
>(
607 std::chrono::duration_cast<std::chrono::nanoseconds>(
608 end_time - started_time_point.value()).count());
612 std::string job_name = current_job->get_name();
618 std::lock_guard<std::mutex> notify_lock(queue_mutex_);
619 current_job_.store(
nullptr, std::memory_order_release);
630 queue_cv_.notify_all();
635 auto end_now = std::chrono::steady_clock::now();
636 auto busy_duration = std::chrono::duration_cast<std::chrono::nanoseconds>(
637 end_now - current_job_start_time_
639 total_busy_time_ns_.fetch_add(
640 static_cast<std::uint64_t
>(busy_duration.count()),
641 std::memory_order_relaxed
644 is_idle_.store(
true, std::memory_order_relaxed);
645 state_since_rep_.store(end_now.time_since_epoch().count(), std::memory_order_release);
648 if (work_result.is_err())
651 jobs_failed_.fetch_add(1, std::memory_order_relaxed);
658 failed_event.
job_name = job_name_for_event;
660 failed_event.
timestamp = std::chrono::steady_clock::now();
662 failed_event.
thread_id = std::this_thread::get_id();
664 failed_event.
wait_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
665 current_job_start_time_ - enqueue_time);
666 failed_event.
execution_time = std::chrono::nanoseconds(execution_duration_ns);
667 failed_event.
error_code = work_result.error().code;
669 diagnostics_->record_event(failed_event);
674 metrics_->record_execution(0,
false);
677 formatter::format(
"error executing job: {}", work_result.error().message),
"thread_system"};
681 jobs_completed_.fetch_add(1, std::memory_order_relaxed);
688 completed_event.
job_name = job_name_for_event;
690 completed_event.
timestamp = std::chrono::steady_clock::now();
692 completed_event.
thread_id = std::this_thread::get_id();
694 completed_event.
wait_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
695 current_job_start_time_ - enqueue_time);
696 completed_event.
execution_time = std::chrono::nanoseconds(execution_duration_ns);
697 diagnostics_->record_event(completed_event);
702 if (!started_time_point.has_value())
705 context_.log(common::interfaces::log_level::debug,
712 context_.log(common::interfaces::log_level::debug,
714 job_name, execution_duration_ns));
717 if (context_.monitoring())
719 common::interfaces::worker_metrics metrics(worker_id_);
720 metrics.jobs_processed.value = 1;
721 metrics.total_processing_time_ns.value =
static_cast<double>(execution_duration_ns);
723 context_.update_worker_metrics(worker_id_, metrics);
729 metrics_->record_execution(execution_duration_ns,
true);
752 return is_idle_.load(std::memory_order_relaxed);
789 worker_cancellation_token_.cancel();
793 std::lock_guard<std::mutex> lock(queue_mutex_);
796 auto* job_ptr = current_job_.load(std::memory_order_acquire);
799 if (job_ptr !=
nullptr)
804 auto job_token = job_ptr->get_cancellation_token();
808 context_.log(common::interfaces::log_level::debug,
810 job_ptr->get_name(), worker_id_));
837 return std::chrono::steady_clock::time_point{
838 std::chrono::steady_clock::duration{rep}
845 auto* job_ptr =
current_job_.load(std::memory_order_acquire);
846 if (job_ptr ==
nullptr)
853 info.job_name = job_ptr->get_name();
856 info.enqueue_time = job_ptr->get_enqueue_time();
857 info.executed_by = std::this_thread::get_id();
859 auto now = std::chrono::steady_clock::now();
860 info.execution_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
864 info.wait_time = std::chrono::duration_cast<std::chrono::nanoseconds>(
Provides a mechanism for cooperative cancellation of operations.
Comprehensive diagnostics API for thread pool monitoring.
A thread-safe job queue for managing and dispatching work items.
Represents a unit of work (task) to be executed, typically by a job queue.
Lock-free work-stealing deque based on Chase-Lev algorithm.
A foundational class for implementing custom worker threads.
Context object that provides access to optional services.
diagnostics::thread_pool_diagnostics * diagnostics_
Pointer to the diagnostics instance for event tracing.
std::atomic< std::uint64_t > total_idle_time_ns_
Total time spent waiting for jobs (idle time) in nanoseconds.
std::function< job *(std::size_t)> steal_function_
Function to steal work from other workers.
std::size_t get_worker_id() const
Get the worker ID.
std::size_t worker_id_
Unique ID for this worker instance.
std::atomic< std::uint64_t > total_busy_time_ns_
Total time spent executing jobs (busy time) in nanoseconds.
std::unique_ptr< job > try_steal_work()
Try to steal work from other workers.
std::uint64_t get_jobs_failed() const noexcept
Gets the total number of jobs that failed during execution.
void set_diagnostics(diagnostics::thread_pool_diagnostics *diag)
Set the diagnostics instance for event tracing.
void set_steal_function(std::function< job *(std::size_t)> steal_fn)
Set the steal function for finding other workers' deques.
const worker_policy & get_policy() const
Get the current worker policy.
std::chrono::nanoseconds get_total_busy_time() const noexcept
Gets the total time spent executing jobs (busy time).
static std::atomic< std::size_t > next_worker_id_
Static counter for generating unique worker IDs.
auto get_context(void) const -> const thread_context &
Gets the thread context for this worker.
void set_metrics(std::shared_ptr< metrics::ThreadPoolMetrics > metrics)
Provide shared metrics storage for this worker.
std::uint32_t diagnostics_sample_rate_
Diagnostics sampling rate (record every Nth job).
bool is_idle() const noexcept
Checks if the worker is currently idle (not processing a job).
std::shared_ptr< metrics::ThreadPoolMetrics > metrics_
Shared metrics aggregator provided by the owning thread pool.
std::unique_ptr< lockfree::work_stealing_deque< job * > > local_deque_
Local work-stealing deque for this worker.
void set_diagnostics_sample_rate(std::uint32_t rate)
Set the diagnostics sampling rate.
auto should_continue_work() const -> bool override
Determines if there are jobs available in the queue to continue working on.
std::uint64_t get_jobs_completed() const noexcept
Gets the total number of jobs successfully completed by this worker.
auto set_context(const thread_context &context) -> void
Sets the thread context for this worker.
std::atomic< std::chrono::steady_clock::time_point::rep > state_since_rep_
Time point when the worker entered its current state.
std::chrono::steady_clock::time_point current_job_start_time_
Time point when the current job started executing.
void set_policy(const worker_policy &policy)
Set the worker policy for this worker.
std::chrono::nanoseconds get_total_idle_time() const noexcept
Gets the total time spent waiting for jobs (idle time).
auto on_stop_requested() -> void override
Called when the worker is requested to stop.
worker_policy policy_
Worker policy configuration.
std::unique_ptr< job > try_get_job()
Try to get a job from local deque first, then global queue.
lockfree::work_stealing_deque< job * > * get_local_deque() noexcept
Get the local work-stealing deque for this worker.
std::atomic< bool > is_idle_
Indicates whether the worker is currently idle (not processing a job).
std::atomic< std::uint64_t > jobs_completed_
Total number of jobs successfully completed by this worker.
virtual ~thread_worker(void)
Virtual destructor. Ensures the worker thread is stopped before destruction.
std::shared_ptr< job_queue > job_queue_
A shared pointer to the job queue from which this worker obtains jobs.
thread_worker(const bool &use_time_tag=true, const thread_context &context=thread_context())
Constructs a new thread_worker.
auto do_work() -> common::VoidResult override
Processes one or more jobs from the queue.
auto set_job_queue(std::shared_ptr< job_queue > job_queue) -> void
Sets the job_queue that this worker should process.
std::atomic< job * > current_job_
Pointer to the currently executing job.
std::mutex queue_mutex_
Mutex protecting job queue replacement.
std::atomic< std::uint64_t > jobs_failed_
Total number of jobs that failed during execution.
std::optional< diagnostics::job_info > get_current_job_info() const noexcept
Gets information about the currently executing job.
std::chrono::steady_clock::time_point get_state_since() const noexcept
Gets the time when the worker entered its current state.
@ running
Job is currently being executed.
@ dequeued
Job was taken from queue by a worker.
@ failed
Job failed with an error.
@ started
Job execution started.
@ completed
Job completed successfully.
Core threading foundation of the thread system library.
@ resource_allocation_failed
std::uint64_t job_id
Unique job identifier for DAG scheduler.
@ info
Informational messages highlighting progress.
Event data for job execution tracing.
std::string job_name
Human-readable name of the job.
std::chrono::nanoseconds wait_time
Time spent waiting in queue before dequeue.
std::optional< std::string > error_message
Error message if the job failed.
std::chrono::nanoseconds execution_time
Time spent executing the job.
std::uint64_t job_id
ID of the job this event relates to.
event_type type
Type of event that occurred.
std::optional< int > error_code
Error code if the job failed.
std::size_t worker_id
Worker ID that processed this job.
std::thread::id thread_id
ID of the thread that processed this event.
std::chrono::system_clock::time_point system_timestamp
System time when the event occurred.
std::chrono::steady_clock::time_point timestamp
Time when the event occurred.
Information about a job in the thread pool.
std::uint64_t job_id
Unique identifier for this job.
Worker behavior policy configuration.
std::chrono::microseconds steal_backoff
Backoff duration to sleep between unsuccessful work-steal attempts.
size_t max_steal_attempts
Maximum number of steal attempts before the worker backs off.
bool enable_work_stealing
Whether work stealing between workers is enabled.
Runtime diagnostics, health monitoring, and execution tracing for thread pools.
Specialized worker thread that processes jobs from a job_queue.