Logger System 0.1.3
High-performance C++20 thread-safe logging system with asynchronous capabilities
batch_processor.cpp
// BSD 3-Clause License
// Copyright (c) 2025, 🍀☀🌕🌥 🌊
// See the LICENSE file in the project root for full license information.

/**
 * @file batch_processor.cpp
 * @brief Optimized batch processing engine for log entries.
 */

#include "batch_processor.h"

#include "jthread_compat.h"

#include <algorithm>
#include <atomic>
#include <chrono>
#include <condition_variable>
#include <functional>
#include <memory>
#include <mutex>
#include <stdexcept>
#include <thread>
#include <vector>
namespace kcenon::logger::async {

/**
 * @brief Worker thread for batch processing with jthread compatibility.
 */
class batch_processing_jthread_worker {
public:
    using process_callback = std::function<void()>;

    batch_processing_jthread_worker(process_callback callback,
                                    std::mutex& notify_mutex,
                                    std::condition_variable& notify_cv)
        : callback_(std::move(callback))
        , notify_mutex_(notify_mutex)
        , notify_cv_(notify_cv)
#if !LOGGER_HAS_JTHREAD
        , stop_source_(std::make_shared<simple_stop_source>())
#endif
    {}

    ~batch_processing_jthread_worker() { stop(); }

    void start() {
        if (running_.exchange(true, std::memory_order_acq_rel)) {
            return; // Already started
        }

#if LOGGER_HAS_JTHREAD
        auto callback = callback_;
        auto& cv = notify_cv_;
        auto& mtx = notify_mutex_;
        thread_ = compat_jthread([callback, &cv, &mtx](std::stop_token stop_token) {
            while (!stop_token.stop_requested()) {
                if (callback) {
                    callback();
                }
                // Wait for notification or timeout instead of polling
                std::unique_lock<std::mutex> lock(mtx);
                cv.wait_for(lock, std::chrono::milliseconds(10),
                            [&stop_token] { return stop_token.stop_requested(); });
            }
        });
#else
        // Reset stop source for new start
        stop_source_->reset();

        auto callback = callback_;
        auto stop = stop_source_;
        auto& cv = notify_cv_;
        auto& mtx = notify_mutex_;
        thread_ = compat_jthread([callback, stop, &cv, &mtx](simple_stop_source& /*unused*/) {
            while (!stop->stop_requested()) {
                if (callback) {
                    callback();
                }
                // Wait for notification or timeout instead of polling
                std::unique_lock<std::mutex> lock(mtx);
                cv.wait_for(lock, std::chrono::milliseconds(10),
                            [&stop] { return stop->stop_requested(); });
            }
        });
#endif
    }

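    // Note: the 10 ms wait_for above bounds wakeup latency: even if a
    // notification is missed, the loop re-checks the stop flag and runs the
    // callback again within one timeout period.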
    void stop() {
        if (!running_.exchange(false, std::memory_order_acq_rel)) {
            return; // Already stopped
        }

        // Request stop and join thread
#if !LOGGER_HAS_JTHREAD
        // The fallback loop watches the shared stop source, so signal it as
        // well (assumes simple_stop_source provides request_stop())
        stop_source_->request_stop();
#endif
        thread_.request_stop();
        thread_.join();
    }

    [[nodiscard]] bool is_running() const noexcept {
        return running_.load(std::memory_order_acquire);
    }

private:
    process_callback callback_;
    std::mutex& notify_mutex_;
    std::condition_variable& notify_cv_;
    compat_jthread thread_;
    std::atomic<bool> running_{false};
#if !LOGGER_HAS_JTHREAD
    std::shared_ptr<simple_stop_source> stop_source_;
#endif
};

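// The worker above is driven by batch_processor: start() installs a callback
// that runs one process_loop_iteration(), and the shared condition variable
// lets add_entry() wake the worker as soon as a new entry is queued.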
batch_processor::batch_processor(log_writer_ptr writer, const config& cfg)
    : config_(cfg)
    , writer_(std::move(writer))
    , queue_(std::make_unique<lockfree_spsc_queue<batch_entry, queue_size>>())
    , current_batch_size_(cfg.initial_batch_size)
    , current_wait_time_(cfg.max_wait_time)
    , last_adjustment_time_(std::chrono::steady_clock::now()) {

    if (!writer_) {
        throw std::invalid_argument("Writer cannot be null");
    }

    // Validate configuration
    if (cfg.min_batch_size > cfg.max_batch_size) {
        throw std::invalid_argument("min_batch_size cannot be greater than max_batch_size");
    }

    if (cfg.initial_batch_size < cfg.min_batch_size ||
        cfg.initial_batch_size > cfg.max_batch_size) {
        throw std::invalid_argument("initial_batch_size must be within min/max range");
    }
}

batch_processor::~batch_processor() {
    stop();
}

bool batch_processor::start() {
    bool expected = false;
    if (!running_.compare_exchange_strong(expected, true)) {
        return false; // Already running
    }

    should_stop_ = false;
    processing_worker_ = std::make_unique<batch_processing_jthread_worker>(
        [this] { process_loop_iteration(); }, notify_mutex_, notify_cv_);
    processing_worker_->start();
    return true;
}

void batch_processor::stop(bool flush_remaining) {
    if (!running_.exchange(false)) {
        return; // Already stopped
    }

    should_stop_ = true;

    // Wake the worker so it can observe should_stop_ and exit
    notify_cv_.notify_one();

    if (processing_worker_) {
        processing_worker_->stop();
        processing_worker_.reset();
    }

    if (flush_remaining) {
        // Process any remaining entries
        batch_entry entry;
        std::vector<batch_entry> final_batch;
        final_batch.reserve(queue_size);

        while (queue_->dequeue(entry)) {
            final_batch.push_back(std::move(entry));
        }

        if (!final_batch.empty()) {
            process_batch(final_batch);
        }

        if (writer_) {
            writer_->flush();
        }
    }
}

bool batch_processor::add_entry(batch_entry&& entry) {
    if (!running_.load(std::memory_order_relaxed)) {
        return false;
    }

    if (!queue_->enqueue(std::move(entry))) {
        stats_.dropped_entries.fetch_add(1, std::memory_order_relaxed);
        return false;
    }

    // Wake the worker thread immediately
    notify_cv_.notify_one();

    return true;
}

bool batch_processor::add_entry(const log_entry& entry) {
    return add_entry(batch_entry(entry));
}

void batch_processor::flush() {
    // This is handled by the processing loop
    // We could add a flush signal mechanism here if needed
}

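// One possible flush-signal mechanism (hypothetical sketch, not implemented
// here): an atomic flag that the worker checks each iteration.
//
//   std::atomic<bool> flush_requested_{false};          // hypothetical member
//   void batch_processor::flush() {
//       flush_requested_.store(true, std::memory_order_release);
//       notify_cv_.notify_one();                        // wake the worker now
//   }
//   // process_loop_iteration() would then drain the queue regardless of
//   // batch size whenever it observes the flag, and clear it afterwards.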
bool batch_processor::is_healthy() const {
    return running_.load(std::memory_order_relaxed) &&
           writer_ && writer_->is_healthy();
}

size_t batch_processor::get_queue_size() const {
    return queue_->size();
}

void batch_processor::process_loop_iteration() {
    static thread_local std::chrono::steady_clock::time_point last_flush_time = std::chrono::steady_clock::now();
    static thread_local std::chrono::steady_clock::time_point last_adjustment_time = std::chrono::steady_clock::now();

    const auto batch_size = current_batch_size_.load(std::memory_order_relaxed);
    const auto wait_time = current_wait_time_.load(std::memory_order_relaxed);

    std::vector<batch_entry> current_batch;
    current_batch.reserve(batch_size);

    const auto deadline = std::chrono::steady_clock::now() + wait_time;
    const auto entries_collected = collect_entries(current_batch, batch_size, deadline);

    if (entries_collected > 0) {
        const auto process_start = std::chrono::steady_clock::now();
        const auto processed = process_batch(current_batch);
        const auto process_end = std::chrono::steady_clock::now();

        const auto processing_time = process_end - process_start;
        const bool flushed_by_size = (entries_collected >= batch_size);
        const bool flushed_by_time = should_flush_by_time(last_flush_time);

        std::string flush_reason;
        if (flushed_by_size) {
            flush_reason = "size";
            stats_.flush_by_size.fetch_add(1, std::memory_order_relaxed);
        } else if (flushed_by_time) {
            flush_reason = "time";
            stats_.flush_by_time.fetch_add(1, std::memory_order_relaxed);
        } else {
            flush_reason = "partial";
        }

        update_stats(processed, processing_time, flush_reason);
        last_flush_time = process_end;

        // Handle back-pressure
        if (config_.enable_back_pressure) {
            handle_back_pressure();
        }
    }

    // Dynamic batch size adjustment
    if (config_.enable_dynamic_sizing) {
        const auto now = std::chrono::steady_clock::now();
        if (now - last_adjustment_time > std::chrono::seconds(5)) {
            adjust_batch_size();
            last_adjustment_time = now;
        }
    }
}

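// collect_entries() below works in two phases: a timed phase that blocks on
// the condition variable while the queue is empty (up to the deadline), and a
// non-blocking drain that opportunistically grabs whatever else is queued.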
size_t batch_processor::collect_entries(std::vector<batch_entry>& batch,
                                        size_t max_entries,
                                        std::chrono::steady_clock::time_point deadline) {
    size_t collected = 0;
    batch_entry entry;

    while (collected < max_entries && std::chrono::steady_clock::now() < deadline) {
        if (queue_->dequeue(entry)) {
            batch.push_back(std::move(entry));
            ++collected;
        } else {
            // Queue is empty, wait for notification or remaining deadline
            auto remaining = deadline - std::chrono::steady_clock::now();
            if (remaining <= std::chrono::steady_clock::duration::zero()) {
                break;
            }
            std::unique_lock<std::mutex> lock(notify_mutex_);
            notify_cv_.wait_for(lock, remaining,
                                [this] { return queue_->size() > 0 || should_stop_.load(std::memory_order_relaxed); });
        }
    }

    // Try to collect more entries if we have time left and space
    while (collected < max_entries && queue_->dequeue(entry)) {
        batch.push_back(std::move(entry));
        ++collected;
    }

    return collected;
}

size_t batch_processor::process_batch(std::vector<batch_entry>& batch) {
    if (batch.empty() || !writer_) {
        return 0;
    }

    size_t processed = 0;
    for (const auto& entry : batch) {
        // Create log_entry from batch_entry
        log_entry log_ent(entry.level, entry.message, entry.file,
                          entry.line, entry.function, entry.timestamp);

        auto result = writer_->write(log_ent);
        if (result.is_ok()) {
            ++processed;
        }
    }

    // Flush after batch processing
    writer_->flush();

    stats_.total_batches.fetch_add(1, std::memory_order_relaxed);
    stats_.total_entries.fetch_add(processed, std::memory_order_relaxed);

    return processed;
}

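// Worked example for adjust_batch_size() below: with current_size = 100,
// queue_size = 250 and a recent processing time of 4 ms, the queue is more
// than twice the batch size and processing is fast, so the new size becomes
// min(max_batch_size, 100 * size_increase_factor), e.g. 150 for a factor of
// 1.5 (the factor value is configuration-dependent).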
void batch_processor::adjust_batch_size() {
    const auto current_size = current_batch_size_.load(std::memory_order_relaxed);
    const auto queue_size = get_queue_size();
    const auto recent_time = recent_processing_time_ms_.load(std::memory_order_relaxed);

    size_t new_size = current_size;

    // Increase batch size if queue is building up and processing is fast
    if (queue_size > current_size * 2 && recent_time < 10.0) {
        new_size = std::min(config_.max_batch_size,
                            static_cast<size_t>(current_size * config_.size_increase_factor));
    }
    // Decrease batch size if processing is slow or queue is small
    else if (recent_time > 100.0 || queue_size < current_size / 4) {
        new_size = std::max(config_.min_batch_size,
                            static_cast<size_t>(current_size * config_.size_decrease_factor));
    }

    if (new_size != current_size) {
        current_batch_size_.store(new_size, std::memory_order_relaxed);
        stats_.dynamic_size_adjustments.fetch_add(1, std::memory_order_relaxed);
    }
}

bool batch_processor::handle_back_pressure() {
    const auto queue_size = get_queue_size();

    if (queue_size > config_.back_pressure_threshold) {
        stats_.back_pressure_events.fetch_add(1, std::memory_order_relaxed);

        // Apply back-pressure delay
        std::this_thread::sleep_for(config_.back_pressure_delay);

        // Continue only if the queue did not grow by more than 50% during the
        // delay (re-read the size; comparing the stale value to itself would
        // always be true)
        return get_queue_size() < queue_size * 1.5;
    }

    return true;
}

bool batch_processor::should_flush_by_time(std::chrono::steady_clock::time_point last_flush_time) const {
    const auto now = std::chrono::steady_clock::now();
    const auto elapsed = now - last_flush_time;
    const auto current_wait = current_wait_time_.load(std::memory_order_relaxed);

    return elapsed >= current_wait;
}

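// update_stats() below smooths the per-batch processing time with an
// exponential moving average: new = alpha * sample + (1 - alpha) * old.
// With alpha = 0.1, old = 10.0 ms and sample = 20.0 ms, the stored value
// becomes 0.1 * 20.0 + 0.9 * 10.0 = 11.0 ms.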
void batch_processor::update_stats(size_t batch_size,
                                   std::chrono::nanoseconds processing_time,
                                   const std::string& flush_reason) {
    (void)batch_size;   // Suppress unused parameter warning
    (void)flush_reason; // Suppress unused parameter warning
    const double processing_time_ms =
        std::chrono::duration_cast<std::chrono::microseconds>(processing_time).count() / 1000.0;

    // Update recent processing time (exponential moving average)
    const double alpha = 0.1;
    const double current_time = recent_processing_time_ms_.load(std::memory_order_relaxed);
    const double new_time = alpha * processing_time_ms + (1.0 - alpha) * current_time;
    recent_processing_time_ms_.store(new_time, std::memory_order_relaxed);

    // Update average batch size
    const auto total_batches = stats_.total_batches.load(std::memory_order_relaxed);
    if (total_batches > 0) {
        const auto total_entries = stats_.total_entries.load(std::memory_order_relaxed);
        const double avg_size = static_cast<double>(total_entries) / total_batches;
        stats_.average_batch_size.store(avg_size, std::memory_order_relaxed);
    }

    // Update average processing time (the stats member name is assumed here)
    stats_.average_processing_time_ms.store(
        recent_processing_time_ms_.load(std::memory_order_relaxed),
        std::memory_order_relaxed);

    // Update recent queue size for adjustment algorithm
    recent_queue_size_.store(get_queue_size(), std::memory_order_relaxed);
}

std::unique_ptr<batch_processor> make_batch_processor(
    log_writer_ptr writer,
    const batch_processor::config& cfg) {
    return std::make_unique<batch_processor>(std::move(writer), cfg);
}

} // namespace kcenon::logger::async
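A minimal usage sketch, assuming a concrete writer type (console_writer here
is illustrative; any log_writer_interface implementation works), default
configuration values, and a pre-built log_entry named some_log_entry:

    using namespace kcenon::logger;

    auto writer = std::make_unique<console_writer>();   // hypothetical writer type
    async::batch_processor::config cfg;                 // defaults assumed valid
    auto processor = async::make_batch_processor(std::move(writer), cfg);

    processor->start();
    processor->add_entry(some_log_entry);               // enqueued and worker woken
    processor->stop(/*flush_remaining=*/true);          // drains the queue and flushes

Note that stop(true) (the default) drains any entries still queued before
flushing the writer, so no accepted entry is silently dropped on shutdown.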