diff --git a/include/tgfx/core/Task.h b/include/tgfx/core/Task.h index 05e6c86b..c1936f45 100644 --- a/include/tgfx/core/Task.h +++ b/include/tgfx/core/Task.h @@ -18,6 +18,7 @@ #pragma once +#include #include #include #include @@ -27,31 +28,38 @@ namespace tgfx { class TaskGroup; /** - * The Task class manages the concurrent execution of one or more code blocks. + * Defines the possible states of a Task. */ -class Task { - public: +enum class TaskStatus { /** - * Submits a code block for asynchronous execution immediately and returns a Task wraps the code - * block. Hold a reference to the returned Task if you want to cancel it or wait for it to finish - * execution. Returns nullptr if the block is nullptr. + * The Task is waiting to be executed. */ - static std::shared_ptr Run(std::function block); - + Queueing, /** - * Returns true if the Task is currently executing its code block. + * The Task is currently executing. */ - bool executing(); - + Executing, /** - * Returns true if the Task has been cancelled + * The Task has finished executing. */ - bool cancelled(); + Finished, + /** + * The Task has been canceled. + */ + Canceled +}; +/** + * The Task class manages the concurrent execution of one or more code blocks. + */ +class Task { + public: /** - * Returns true if the Task has finished executing its code block. + * Submits a code block for asynchronous execution immediately and returns a Task wraps the code + * block. Hold a reference to the returned Task if you want to cancel it or wait for it to finish + * execution. Returns nullptr if the block is nullptr. */ - bool finished(); + static std::shared_ptr Run(std::function block); /** * Advises the Task that it should stop executing its code block. Cancellation does not affect the @@ -62,16 +70,20 @@ class Task { /** * Blocks the current thread until the Task finishes its execution. Returns immediately if the * Task is finished or canceled. The task may be executed on the calling thread if it is not - * cancelled and still in the queue. + * canceled and still in the queue. */ void wait(); + /** + * Return the current status of the Task. + */ + TaskStatus status() const; + private: std::mutex locker = {}; std::condition_variable condition = {}; - bool _executing = true; - bool _cancelled = false; std::function block = nullptr; + std::atomic _status = TaskStatus::Queueing; explicit Task(std::function block); void execute(); diff --git a/src/core/utils/LockFreeQueue.h b/src/core/utils/LockFreeQueue.h index 4232ddd7..d39d78cc 100644 --- a/src/core/utils/LockFreeQueue.h +++ b/src/core/utils/LockFreeQueue.h @@ -33,21 +33,27 @@ namespace tgfx { static constexpr size_t CACHELINE_SIZE = 64; -// QUEUE_SIZE needs to be a power of 2, otherwise the implementation of GetIndex needs to be changed. -static constexpr uint32_t QUEUE_SIZE = 1024; - -inline uint32_t GetIndex(uint32_t position) { - return position & (QUEUE_SIZE - 1); -} template class LockFreeQueue { public: - LockFreeQueue() { - queuePool = reinterpret_cast(std::calloc(QUEUE_SIZE, sizeof(T))); + /** + * The capacity needs to be a power of 2, otherwise, it will be automatically set to the nearest + * power of 2 larger than the capacity. + * @param capacity + */ + explicit LockFreeQueue(uint32_t capacity) { + if ((capacity & (capacity - 1)) != 0) { + _capacity = 1; + while (_capacity < capacity) { + _capacity <<= 1; + } + } else { + _capacity = capacity; + } + queuePool = reinterpret_cast(std::calloc(_capacity, sizeof(T))); if (queuePool == nullptr) { - LOGE("LockFreeQueue init Failed!\n"); - return; + ABORT("LockFreeQueue init Failed!\n"); } } @@ -59,9 +65,6 @@ class LockFreeQueue { } T dequeue() { - if (queuePool == nullptr) { - return nullptr; - } uint32_t newHead = 0; uint32_t oldHead = head.load(std::memory_order_relaxed); T element = nullptr; @@ -71,11 +74,11 @@ class LockFreeQueue { if (newHead == tailPosition.load(std::memory_order_acquire)) { return nullptr; } - element = queuePool[GetIndex(newHead)]; + element = queuePool[getIndex(newHead)]; } while (!head.compare_exchange_weak(oldHead, newHead, std::memory_order_acq_rel, std::memory_order_relaxed)); - queuePool[GetIndex(newHead)] = nullptr; + queuePool[getIndex(newHead)] = nullptr; uint32_t newHeadPosition = 0; uint32_t oldHeadPosition = headPosition.load(std::memory_order_relaxed); @@ -87,22 +90,19 @@ class LockFreeQueue { } bool enqueue(const T& element) { - if (queuePool == nullptr) { - return false; - } uint32_t newTail = 0; uint32_t oldTail = tail.load(std::memory_order_relaxed); do { - newTail = oldTail + 1; - if (GetIndex(newTail) == GetIndex(headPosition.load(std::memory_order_acquire))) { - LOGI("The queue has reached its maximum capacity, capacity: %u!\n", QUEUE_SIZE); + if (getIndex(oldTail) == getIndex(headPosition.load(std::memory_order_acquire))) { + LOGI("The queue has reached its maximum capacity, capacity: %u!\n", _capacity); return false; } + newTail = oldTail + 1; } while (!tail.compare_exchange_weak(oldTail, newTail, std::memory_order_acq_rel, std::memory_order_relaxed)); - queuePool[GetIndex(oldTail)] = std::move(element); + queuePool[getIndex(oldTail)] = std::move(element); uint32_t newTailPosition = 0; uint32_t oldTailPosition = tailPosition.load(std::memory_order_relaxed); @@ -115,6 +115,7 @@ class LockFreeQueue { private: T* queuePool = nullptr; + uint32_t _capacity = 0; #ifdef DISABLE_ALIGNAS // head indicates the position after requesting space. std::atomic head = {0}; @@ -134,6 +135,10 @@ class LockFreeQueue { // tailPosition indicates the position after filling data. alignas(CACHELINE_SIZE) std::atomic tailPosition = {1}; #endif + + uint32_t getIndex(uint32_t position) { + return position & (_capacity - 1); + } }; } // namespace tgfx diff --git a/src/core/utils/Task.cpp b/src/core/utils/Task.cpp index ec406860..669dd714 100644 --- a/src/core/utils/Task.cpp +++ b/src/core/utils/Task.cpp @@ -34,42 +34,54 @@ std::shared_ptr Task::Run(std::function block) { Task::Task(std::function block) : block(std::move(block)) { } -bool Task::executing() { - std::lock_guard autoLock(locker); - return _executing; -} - -bool Task::cancelled() { - std::lock_guard autoLock(locker); - return _cancelled; -} - -bool Task::finished() { - std::lock_guard autoLock(locker); - return !_executing && !_cancelled; -} - void Task::wait() { - std::unique_lock autoLock(locker); - if (!_executing) { + auto oldStatus = _status.load(std::memory_order_relaxed); + if (oldStatus == TaskStatus::Canceled || oldStatus == TaskStatus::Finished) { return; } - condition.wait(autoLock); + // If wait() is called from the thread pool, all threads might block, leaving no thread to execute + // this task. To avoid deadlock, execute the task directly on the current thread if it's queued. + if (oldStatus == TaskStatus::Queueing) { + if (_status.compare_exchange_weak(oldStatus, TaskStatus::Executing, std::memory_order_acq_rel, + std::memory_order_relaxed)) { + block(); + oldStatus = TaskStatus::Executing; + while (!_status.compare_exchange_weak(oldStatus, TaskStatus::Finished, + std::memory_order_acq_rel, std::memory_order_relaxed)) + ; + return; + } + } + std::unique_lock autoLock(locker); + if (_status.load(std::memory_order_acquire) == TaskStatus::Executing) { + condition.wait(autoLock); + } } void Task::cancel() { - std::unique_lock autoLock(locker); - if (!_executing) { - return; + auto currentStatus = _status.load(std::memory_order_relaxed); + if (currentStatus == TaskStatus::Queueing) { + _status.compare_exchange_weak(currentStatus, TaskStatus::Canceled, std::memory_order_acq_rel, + std::memory_order_relaxed); } - _executing = false; - _cancelled = true; } void Task::execute() { - block(); - std::lock_guard auoLock(locker); - _executing = false; - condition.notify_all(); + auto oldStatus = _status.load(std::memory_order_relaxed); + if (oldStatus == TaskStatus::Queueing && + _status.compare_exchange_weak(oldStatus, TaskStatus::Executing, std::memory_order_acq_rel, + std::memory_order_relaxed)) { + block(); + oldStatus = TaskStatus::Executing; + while (!_status.compare_exchange_weak(oldStatus, TaskStatus::Finished, + std::memory_order_acq_rel, std::memory_order_relaxed)) + ; + std::unique_lock autoLock(locker); + condition.notify_all(); + } +} + +TaskStatus Task::status() const { + return _status.load(std::memory_order_relaxed); } } // namespace tgfx diff --git a/src/core/utils/TaskGroup.cpp b/src/core/utils/TaskGroup.cpp index f1edfa54..1acff944 100644 --- a/src/core/utils/TaskGroup.cpp +++ b/src/core/utils/TaskGroup.cpp @@ -28,6 +28,8 @@ namespace tgfx { static constexpr auto THREAD_TIMEOUT = std::chrono::seconds(10); +static constexpr uint32_t THREAD_POOL_SIZE = 32; +static constexpr uint32_t TASK_QUEUE_SIZE = 1024; int GetCPUCores() { int cpuCores = 0; @@ -44,9 +46,6 @@ int GetCPUCores() { return cpuCores; } -static const int CPUCores = GetCPUCores(); -static const int MaxThreads = CPUCores > 16 ? 16 : CPUCores; - TaskGroup* TaskGroup::GetInstance() { static auto& taskGroup = *new TaskGroup(); return &taskGroup; @@ -76,15 +75,18 @@ void OnAppExit() { } TaskGroup::TaskGroup() { + threads = new LockFreeQueue(THREAD_POOL_SIZE); + tasks = new LockFreeQueue>(TASK_QUEUE_SIZE); std::atexit(OnAppExit); - threads.resize(static_cast(MaxThreads), nullptr); } bool TaskGroup::checkThreads() { + static const int CPUCores = GetCPUCores(); + static const int MaxThreads = CPUCores > 16 ? 16 : CPUCores; if (waitingThreads == 0 && totalThreads < MaxThreads) { auto thread = new (std::nothrow) std::thread(&TaskGroup::RunLoop, this); if (thread) { - threads[static_cast(totalThreads)] = thread; + threads->enqueue(thread); totalThreads++; } } else { @@ -100,7 +102,7 @@ bool TaskGroup::pushTask(std::shared_ptr task) { if (exited || !checkThreads()) { return false; } - if (!tasks.enqueue(std::move(task))) { + if (!tasks->enqueue(std::move(task))) { return false; } if (waitingThreads > 0) { @@ -112,7 +114,7 @@ bool TaskGroup::pushTask(std::shared_ptr task) { std::shared_ptr TaskGroup::popTask() { std::unique_lock autoLock(locker); while (!exited) { - auto task = tasks.dequeue(); + auto task = tasks->dequeue(); if (task) { return task; } @@ -129,12 +131,12 @@ std::shared_ptr TaskGroup::popTask() { void TaskGroup::exit() { exited = true; condition.notify_all(); - for (int i = 0; i < totalThreads; i++) { - auto thread = threads[static_cast(i)]; - if (thread) { - ReleaseThread(thread); - } + std::thread* thread = nullptr; + while ((thread = threads->dequeue()) != nullptr) { + ReleaseThread(thread); } + delete threads; + delete tasks; totalThreads = 0; waitingThreads = 0; } diff --git a/src/core/utils/TaskGroup.h b/src/core/utils/TaskGroup.h index 6d977ea4..4fb15424 100644 --- a/src/core/utils/TaskGroup.h +++ b/src/core/utils/TaskGroup.h @@ -34,8 +34,8 @@ class TaskGroup { std::atomic_int totalThreads = 0; std::atomic_bool exited = false; std::atomic_int waitingThreads = 0; - LockFreeQueue> tasks = {}; - std::vector threads = {}; + LockFreeQueue>* tasks = nullptr; + LockFreeQueue* threads = nullptr; static TaskGroup* GetInstance(); static void RunLoop(TaskGroup* taskGroup);