Line | Source | % of fetches |
---|---|---|
1 | // Copyright (c) 2007-2016 Hartmut Kaiser | |
2 | // Copyright (c) 2011 Bryce Lelbach | |
3 | // | |
4 | // Distributed under the Boost Software License, Version 1.0. (See accompanying | |
5 | // file LICENSE_1_0.txt or copy at http://www.boost.org/LICENSE_1_0.txt) | |
6 | ||
7 | #if !defined(HPX_THREADMANAGER_THREAD_QUEUE_AUG_25_2009_0132PM) | |
8 | #define HPX_THREADMANAGER_THREAD_QUEUE_AUG_25_2009_0132PM | |
9 | ||
10 | #include <hpx/config.hpp> | |
11 | #include <hpx/error_code.hpp> | |
12 | #include <hpx/runtime/threads/policies/lockfree_queue_backends.hpp> | |
13 | #include <hpx/runtime/threads/policies/queue_helpers.hpp> | |
14 | #include <hpx/runtime/threads/thread_data.hpp> | |
15 | #include <hpx/throw_exception.hpp> | |
16 | #include <hpx/util/assert.hpp> | |
17 | #include <hpx/util/block_profiler.hpp> | |
18 | #include <hpx/util/function.hpp> | |
19 | #include <hpx/util/get_and_reset_value.hpp> | |
20 | #include <hpx/util/high_resolution_clock.hpp> | |
21 | #include <hpx/util/unlock_guard.hpp> | |
22 | ||
23 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
24 | # include <hpx/util/tick_counter.hpp> | |
25 | #endif | |
26 | ||
27 | #include <boost/atomic.hpp> | |
28 | #include <boost/exception_ptr.hpp> | |
29 | #include <boost/thread/condition.hpp> | |
30 | #include <boost/thread/mutex.hpp> | |
31 | ||
32 | #include <cstddef> | |
33 | #include <cstdint> | |
34 | #include <functional> | |
35 | #include <list> | |
36 | #include <map> | |
37 | #include <memory> | |
38 | #include <mutex> | |
39 | #include <unordered_set> | |
40 | #include <utility> | |
41 | #include <vector> | |
42 | ||
43 | /////////////////////////////////////////////////////////////////////////////// | |
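| // The std::hash specialization below lets thread_id_type be used as the key | |
| // of standard unordered containers (such as the thread map further down in | |
| // this file); it simply hashes the numeric value of the id's underlying pointer. | |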
44 | namespace std | |
45 | { | |
46 | template <> | |
47 | struct hash< ::hpx::threads::thread_id_type> | |
48 | { | |
49 | typedef ::hpx::threads::thread_id_type argument_type; | |
50 | typedef std::size_t result_type; | |
51 | ||
52 | std::size_t operator()(::hpx::threads::thread_id_type const& v) const | |
53 | { | |
54 | std::hash<std::size_t> hasher_; | |
55 | return hasher_(reinterpret_cast<std::size_t>(v.get())); | |
56 | } | |
57 | }; | |
58 | } | |
59 | ||
60 | /////////////////////////////////////////////////////////////////////////////// | |
61 | namespace hpx { namespace threads { namespace policies | |
62 | { | |
63 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
64 | /////////////////////////////////////////////////////////////////////////// | |
65 | // We control whether to collect queue wait times using this global bool. | |
66 | // It will be set by any of the related performance counters. Once set it | |
67 | // stays set, thus no race conditions will occur. | |
68 | extern bool maintain_queue_wait_times; | |
69 | #endif | |
70 | #ifdef HPX_HAVE_THREAD_MINIMAL_DEADLOCK_DETECTION | |
71 | /////////////////////////////////////////////////////////////////////////// | |
72 | // We control whether to perform minimal deadlock detection using this | |
73 | // global bool variable. It will be set once by the runtime configuration | |
74 | // startup code. | |
75 | extern bool minimal_deadlock_detection; | |
76 | #endif | |
77 | ||
78 | /////////////////////////////////////////////////////////////////////////// | |
79 | // Queue back-end interface: | |
80 | // | |
81 | // template <typename T> | |
82 | // struct queue_backend | |
83 | // { | |
84 | // typedef ... container_type; | |
85 | // typedef ... value_type; | |
86 | // typedef ... reference; | |
87 | // typedef ... const_reference; | |
88 | // typedef ... size_type; | |
89 | // | |
90 | // queue_backend( | |
91 | // size_type initial_size = ... | |
92 | // , size_type num_thread = ... | |
93 | // ); | |
94 | // | |
95 | // bool push(const_reference val); | |
96 | // | |
97 | // bool pop(reference val, bool steal = true); | |
98 | // | |
99 | // bool empty(); | |
100 | // }; | |
101 | // | |
102 | // struct queue_policy | |
103 | // { | |
104 | // template <typename T> | |
105 | // struct apply | |
106 | // { | |
107 | // typedef ... type; | |
108 | // }; | |
109 | // }; | |
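| // For illustration only (not part of this header): a minimal, lock-based | |
| // back-end and its policy, satisfying the interface sketched above, could | |
| // look roughly like this (the names and the use of std::deque are assumptions): | |
| // | |
| //     template <typename T> | |
| //     struct locked_deque_backend | |
| //     { | |
| //         typedef std::deque<T> container_type; | |
| //         typedef T value_type; | |
| //         typedef T& reference; | |
| //         typedef T const& const_reference; | |
| //         typedef std::size_t size_type; | |
| // | |
| //         locked_deque_backend(size_type = 0, size_type = 0) {} | |
| // | |
| //         bool push(const_reference val) | |
| //         { std::lock_guard<boost::mutex> l(mtx_); items_.push_back(val); return true; } | |
| // | |
| //         bool pop(reference val, bool /*steal*/ = true) | |
| //         { | |
| //             std::lock_guard<boost::mutex> l(mtx_); | |
| //             if (items_.empty()) return false; | |
| //             val = items_.front(); items_.pop_front(); return true; | |
| //         } | |
| // | |
| //         bool empty() | |
| //         { std::lock_guard<boost::mutex> l(mtx_); return items_.empty(); } | |
| // | |
| //         boost::mutex mtx_; | |
| //         container_type items_; | |
| //     }; | |
| // | |
| //     struct locked_deque | |
| //     { | |
| //         template <typename T> | |
| //         struct apply { typedef locked_deque_backend<T> type; }; | |
| //     }; | |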
110 | template <typename Mutex = boost::mutex, | |
111 | typename PendingQueuing = lockfree_lifo, | |
112 | typename StagedQueuing = lockfree_lifo, | |
113 | typename TerminatedQueuing = lockfree_fifo> | |
114 | class thread_queue | |
115 | { | |
116 | private: | |
117 | // we use a simple mutex to protect the data members for now | |
118 | typedef Mutex mutex_type; | |
119 | ||
120 | // Add this number of threads to the work items queue each time the | |
121 | // function \a add_new() is called if the queue is empty. | |
122 | enum { | |
123 | min_add_new_count = 10, | |
124 | max_add_new_count = 10, | |
125 | max_delete_count = 1000 | |
126 | }; | |
127 | ||
128 | // this is the type of the set holding all threads (except depleted ones) | |
129 | typedef std::unordered_set<thread_id_type> thread_map_type; | |
130 | ||
131 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
132 | typedef | |
133 | util::tuple<thread_init_data, thread_state_enum, std::uint64_t> | |
134 | task_description; | |
135 | #else | |
136 | typedef util::tuple<thread_init_data, thread_state_enum> task_description; | |
137 | #endif | |
138 | ||
139 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
140 | typedef util::tuple<thread_data*, std::uint64_t> thread_description; | |
141 | #else | |
142 | typedef thread_data thread_description; | |
143 | #endif | |
144 | ||
145 | typedef typename PendingQueuing::template | |
146 | apply<thread_description*>::type work_items_type; | |
147 | ||
148 | typedef typename StagedQueuing::template | |
149 | apply<task_description*>::type task_items_type; | |
150 | ||
151 | typedef typename TerminatedQueuing::template | |
152 | apply<thread_data*>::type terminated_items_type; | |
153 | ||
154 | protected: | |
155 | template <typename Lock> | |
156 | void create_thread_object(threads::thread_id_type& thrd, | |
157 | threads::thread_init_data& data, thread_state_enum state, Lock& lk) | |
158 | { | |
159 | HPX_ASSERT(lk.owns_lock()); | |
160 | HPX_ASSERT(data.stacksize != 0); | |
161 | ||
162 | std::ptrdiff_t stacksize = data.stacksize; | |
163 | ||
164 | std::list<thread_id_type>* heap = nullptr; | |
165 | ||
166 | if (stacksize == get_stack_size(thread_stacksize_small)) | |
167 | { | |
168 | heap = &thread_heap_small_; | |
169 | } | |
170 | else if (stacksize == get_stack_size(thread_stacksize_medium)) | |
171 | { | |
172 | heap = &thread_heap_medium_; | |
173 | } | |
174 | else if (stacksize == get_stack_size(thread_stacksize_large)) | |
175 | { | |
176 | heap = &thread_heap_large_; | |
177 | } | |
178 | else if (stacksize == get_stack_size(thread_stacksize_huge)) | |
179 | { | |
180 | heap = &thread_heap_huge_; | |
181 | } | |
182 | else { | |
183 | switch(stacksize) { | |
184 | case thread_stacksize_small: | |
185 | heap = &thread_heap_small_; | |
186 | break; | |
187 | ||
188 | case thread_stacksize_medium: | |
189 | heap = &thread_heap_medium_; | |
190 | break; | |
191 | ||
192 | case thread_stacksize_large: | |
193 | heap = &thread_heap_large_; | |
194 | break; | |
195 | ||
196 | case thread_stacksize_huge: | |
197 | heap = &thread_heap_huge_; | |
198 | break; | |
199 | ||
200 | default: | |
201 | break; | |
202 | } | |
203 | } | |
204 | HPX_ASSERT(heap); | |
205 | ||
206 | // Check for an unused thread object. | |
207 | if (!heap->empty()) | |
208 | { | |
209 | // Take ownership of the thread object and rebind it. | |
210 | thrd = heap->front(); | |
211 | heap->pop_front(); | |
212 | thrd->rebind(data, | |
213 | state == pending_do_not_schedule ? pending : state); | |
214 | } | |
215 | ||
216 | else | |
217 | { | |
218 | hpx::util::unlock_guard<Lock> ull(lk); | |
219 | ||
220 | // Allocate a new thread object. | |
221 | thrd = threads::thread_data::create( | |
222 | data, memory_pool_, | |
223 | state == pending_do_not_schedule ? pending : state); | |
224 | } | |
225 | } | |
226 | ||
227 | /////////////////////////////////////////////////////////////////////// | |
228 | // add new threads if there is some amount of work available | |
229 | std::size_t add_new(std::int64_t add_count, thread_queue* addfrom, | |
230 | std::unique_lock<mutex_type> &lk, bool steal = false) | |
231 | { | |
232 | HPX_ASSERT(lk.owns_lock()); | |
233 | ||
234 | if (HPX_UNLIKELY(0 == add_count)) | |
235 | return 0; | |
236 | ||
237 | std::size_t added = 0; | |
238 | task_description* task = nullptr; | |
239 | while (add_count-- && addfrom->new_tasks_.pop(task, steal)) | |
240 | { | |
241 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
242 | if (maintain_queue_wait_times) { | |
243 | addfrom->new_tasks_wait_ += | |
244 | util::high_resolution_clock::now() - util::get<2>(*task); | |
245 | ++addfrom->new_tasks_wait_count_; | |
246 | } | |
247 | #endif | |
248 | --addfrom->new_tasks_count_; | |
249 | ||
250 | // measure thread creation time | |
251 | util::block_profiler_wrapper<add_new_tag> bp(add_new_logger_); | |
252 | ||
253 | // create the new thread | |
254 | threads::thread_init_data& data = util::get<0>(*task); | |
255 | thread_state_enum state = util::get<1>(*task); | |
256 | threads::thread_id_type thrd; | |
257 | ||
258 | create_thread_object(thrd, data, state, lk); | |
259 | ||
260 | delete task; | |
261 | ||
262 | // add the new entry to the map of all threads | |
263 | std::pair<thread_map_type::iterator, bool> p = | |
264 | thread_map_.insert(thrd); | |
265 | ||
266 | if (HPX_UNLIKELY(!p.second)) { | |
267 | HPX_THROW_EXCEPTION(hpx::out_of_memory, | |
268 | "threadmanager::add_new", | |
269 | "Couldn't add new thread to the thread map"); | |
270 | return 0; | |
271 | } | |
272 | ++thread_map_count_; | |
273 | ||
274 | // only insert the thread into the work-items queue if it is in | |
275 | // pending state | |
276 | if (state == pending) { | |
277 | // pushing the new thread into the pending queue of the | |
278 | // specified thread_queue | |
279 | ++added; | |
280 | schedule_thread(thrd.get()); | |
281 | } | |
282 | ||
283 | // this thread has to be in the map now | |
284 | HPX_ASSERT(thread_map_.find(thrd.get()) != thread_map_.end()); | |
285 | HPX_ASSERT(thrd->get_pool() == &memory_pool_); | |
286 | } | |
287 | ||
288 | if (added) { | |
289 | LTM_(debug) << "add_new: added " << added << " tasks to queues"; //-V128 | |
290 | } | |
291 | return added; | |
292 | } | |
293 | ||
294 | /////////////////////////////////////////////////////////////////////// | |
295 | bool add_new_if_possible(std::size_t& added, thread_queue* addfrom, | |
296 | std::unique_lock<mutex_type> &lk, bool steal = false) | |
297 | { | |
298 | HPX_ASSERT(lk.owns_lock()); | |
299 | ||
300 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
301 | util::tick_counter tc(add_new_time_); | |
302 | #endif | |
303 | ||
304 | if (0 == addfrom->new_tasks_count_.load(boost::memory_order_relaxed)) | |
305 | return false; | |
306 | ||
307 | // create new threads from pending tasks (if appropriate) | |
308 | std::int64_t add_count = -1; // default is no constraint | |
309 | ||
310 | // if the map doesn't hold max_count threads yet add some | |
311 | // FIXME: why do we have this test? can max_count_ ever be zero? | |
312 | if (HPX_LIKELY(max_count_)) { | |
313 | std::size_t count = thread_map_.size(); | |
314 | if (max_count_ >= count + min_add_new_count) { //-V104 | |
315 | HPX_ASSERT(max_count_ - count < | |
316 | static_cast<std::size_t>((std::numeric_limits | |
317 | <std::int64_t>::max)())); | |
318 | add_count = static_cast<std::int64_t>(max_count_ - count); | |
319 | if (add_count < min_add_new_count) | |
320 | add_count = min_add_new_count; | |
321 | } | |
322 | else { | |
323 | return false; | |
324 | } | |
325 | } | |
326 | ||
327 | std::size_t addednew = add_new(add_count, addfrom, lk, steal); | |
328 | added += addednew; | |
329 | return addednew != 0; | |
330 | } | |
331 | ||
332 | /////////////////////////////////////////////////////////////////////// | |
333 | bool add_new_always(std::size_t& added, thread_queue* addfrom, | |
334 | std::unique_lock<mutex_type> &lk, bool steal = false) | |
335 | { | |
336 | HPX_ASSERT(lk.owns_lock()); | |
337 | ||
338 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
339 | util::tick_counter tc(add_new_time_); | |
340 | #endif | |
341 | ||
342 | if (0 == addfrom->new_tasks_count_.load(boost::memory_order_relaxed)) | |
343 | return false; | |
344 | ||
345 | // create new threads from pending tasks (if appropriate) | |
346 | std::int64_t add_count = -1; // default is no constraint | |
347 | ||
348 | // if we are desperate (no work in the queues), add some even if the | |
349 | // map holds more than max_count | |
350 | if (HPX_LIKELY(max_count_)) { | |
351 | std::size_t count = thread_map_.size(); | |
352 | if (max_count_ >= count + min_add_new_count) { //-V104 | |
353 | HPX_ASSERT(max_count_ - count < | |
354 | static_cast<std::size_t>((std::numeric_limits | |
355 | <std::int64_t>::max)())); | |
356 | add_count = static_cast<std::int64_t>(max_count_ - count); | |
357 | if (add_count < min_add_new_count) | |
358 | add_count = min_add_new_count; | |
359 | if (add_count > max_add_new_count) | |
360 | add_count = max_add_new_count; | |
361 | } | |
362 | else if (work_items_.empty()) { | |
363 | add_count = min_add_new_count; // add this number of threads | |
364 | max_count_ += min_add_new_count; // increase max_count //-V101 | |
365 | } | |
366 | else { | |
367 | return false; | |
368 | } | |
369 | } | |
370 | ||
371 | std::size_t addednew = add_new(add_count, addfrom, lk, steal); | |
372 | added += addednew; | |
373 | return addednew != 0; | |
374 | } | |
375 | ||
376 | void recycle_thread(thread_id_type thrd) | |
377 | { | |
378 | std::ptrdiff_t stacksize = thrd->get_stack_size(); | |
379 | ||
380 | if (stacksize == get_stack_size(thread_stacksize_small)) | |
381 | { | |
382 | thread_heap_small_.push_front(thrd); | |
383 | } | |
384 | else if (stacksize == get_stack_size(thread_stacksize_medium)) | |
385 | { | |
386 | thread_heap_medium_.push_front(thrd); | |
387 | } | |
388 | else if (stacksize == get_stack_size(thread_stacksize_large)) | |
389 | { | |
390 | thread_heap_large_.push_front(thrd); | |
391 | } | |
392 | else if (stacksize == get_stack_size(thread_stacksize_huge)) | |
393 | { | |
394 | thread_heap_huge_.push_front(thrd); | |
395 | } | |
396 | else | |
397 | { | |
398 | switch(stacksize) { | |
399 | case thread_stacksize_small: | |
400 | thread_heap_small_.push_front(thrd); | |
401 | break; | |
402 | ||
403 | case thread_stacksize_medium: | |
404 | thread_heap_medium_.push_front(thrd); | |
405 | break; | |
406 | ||
407 | case thread_stacksize_large: | |
408 | thread_heap_large_.push_front(thrd); | |
409 | break; | |
410 | ||
411 | case thread_stacksize_huge: | |
412 | thread_heap_huge_.push_front(thrd); | |
413 | break; | |
414 | ||
415 | default: | |
416 | HPX_ASSERT(false); | |
417 | break; | |
418 | } | |
419 | } | |
420 | } | |
421 | ||
422 | public: | |
423 | /// This function makes sure all threads which are marked for deletion | |
424 | /// (state is terminated) are properly destroyed. | |
425 | /// | |
426 | /// This returns 'true' if there are no more terminated threads waiting | |
427 | /// to be deleted. | |
428 | bool cleanup_terminated_locked_helper(bool delete_all = false) | |
429 | { | |
430 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
431 | util::tick_counter tc(cleanup_terminated_time_); | |
432 | #endif | |
433 | ||
434 | if (terminated_items_count_ == 0 && thread_map_.empty()) | |
435 | return true; | |
436 | ||
437 | if (delete_all) { | |
438 | // delete all threads | |
439 | thread_data* todelete; | |
440 | while (terminated_items_.pop(todelete)) | |
441 | { | |
442 | --terminated_items_count_; | |
443 | ||
444 | // this thread has to be in this map | |
445 | HPX_ASSERT(thread_map_.find(todelete) != thread_map_.end()); | |
446 | ||
447 | bool deleted = thread_map_.erase(todelete) != 0; | |
448 | HPX_ASSERT(deleted); | |
449 | if (deleted) { | |
450 | --thread_map_count_; | |
451 | HPX_ASSERT(thread_map_count_ >= 0); | |
452 | } | |
453 | } | |
454 | } | |
455 | else { | |
456 | // delete only this many threads | |
457 | std::int64_t delete_count = | |
458 | (std::max)( | |
459 | static_cast<std::int64_t>(terminated_items_count_ / 10), | |
460 | static_cast<std::int64_t>(max_delete_count)); | |
461 | ||
462 | thread_data* todelete; | |
463 | while (delete_count && terminated_items_.pop(todelete)) | |
464 | { | |
465 | --terminated_items_count_; | |
466 | ||
467 | thread_map_type::iterator it = thread_map_.find(todelete); | |
468 | ||
469 | // this thread has to be in this map | |
470 | HPX_ASSERT(it != thread_map_.end()); | |
471 | ||
472 | recycle_thread(*it); | |
473 | ||
474 | thread_map_.erase(it); | |
475 | --thread_map_count_; | |
476 | HPX_ASSERT(thread_map_count_ >= 0); | |
477 | ||
478 | --delete_count; | |
479 | } | |
480 | } | |
481 | return terminated_items_count_ == 0; | |
482 | } | |
483 | ||
484 | bool cleanup_terminated_locked(bool delete_all = false) | |
485 | { | |
486 | return cleanup_terminated_locked_helper(delete_all) && | |
487 | thread_map_.empty(); | |
488 | } | |
489 | ||
490 | public: | |
491 | bool cleanup_terminated(bool delete_all = false) | |
492 | { | |
493 | if (terminated_items_count_ == 0) | |
494 | return thread_map_count_ == 0; | |
495 | ||
496 | if (delete_all) { | |
497 | // do not lock mutex while deleting all threads, do it piece-wise | |
498 | bool thread_map_is_empty = false; | |
499 | while (true) | |
500 | { | |
501 | std::lock_guard<mutex_type> lk(mtx_); | |
502 | if (cleanup_terminated_locked_helper(false)) | |
503 | { | |
504 | thread_map_is_empty = | |
505 | (thread_map_count_ == 0) && (new_tasks_count_ == 0); | |
506 | break; | |
507 | } | |
508 | } | |
509 | return thread_map_is_empty; | |
510 | } | |
511 | ||
512 | std::lock_guard<mutex_type> lk(mtx_); | |
513 | return cleanup_terminated_locked_helper(false) && | |
514 | (thread_map_count_ == 0) && (new_tasks_count_ == 0); | |
515 | } | |
516 | ||
517 | // The maximum number of active threads this thread manager should | |
518 | // create. This number will be a constraint only as long as the work | |
519 | // items queue is not empty. Otherwise the number of active threads | |
520 | // will be incremented in steps equal to the \a min_add_new_count | |
521 | // specified above. | |
522 | enum { max_thread_count = 1000 }; | |
523 | ||
524 | thread_queue(std::size_t queue_num = std::size_t(-1), | |
525 | std::size_t max_count = max_thread_count) | |
526 | : thread_map_count_(0), | |
527 | work_items_(128, queue_num), | |
528 | work_items_count_(0), | |
529 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
530 | work_items_wait_(0), | |
531 | work_items_wait_count_(0), | |
532 | #endif | |
533 | terminated_items_(128), | |
534 | terminated_items_count_(0), | |
535 | max_count_((0 == max_count) | |
536 | ? static_cast<std::size_t>(max_thread_count) | |
537 | : max_count), | |
538 | new_tasks_(128), | |
539 | new_tasks_count_(0), | |
540 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
541 | new_tasks_wait_(0), | |
542 | new_tasks_wait_count_(0), | |
543 | #endif | |
544 | memory_pool_(64), | |
545 | thread_heap_small_(), | |
546 | thread_heap_medium_(), | |
547 | thread_heap_large_(), | |
548 | thread_heap_huge_(), | |
549 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
550 | add_new_time_(0), | |
551 | cleanup_terminated_time_(0), | |
552 | #endif | |
553 | #ifdef HPX_HAVE_THREAD_STEALING_COUNTS | |
554 | pending_misses_(0), | |
555 | pending_accesses_(0), | |
556 | stolen_from_pending_(0), | |
557 | stolen_from_staged_(0), | |
558 | stolen_to_pending_(0), | |
559 | stolen_to_staged_(0), | |
560 | #endif | |
561 | add_new_logger_("thread_queue::add_new") | |
562 | {} | |
563 | ||
564 | void set_max_count(std::size_t max_count = max_thread_count) | |
565 | { | |
566 | max_count_ = (0 == max_count) ? max_thread_count : max_count; //-V105 | |
567 | } | |
568 | ||
569 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
570 | std::uint64_t get_creation_time(bool reset) | |
571 | { | |
572 | return util::get_and_reset_value(add_new_time_, reset); | |
573 | } | |
574 | ||
575 | std::uint64_t get_cleanup_time(bool reset) | |
576 | { | |
577 | return util::get_and_reset_value(cleanup_terminated_time_, reset); | |
578 | } | |
579 | #endif | |
580 | ||
581 | /////////////////////////////////////////////////////////////////////// | |
582 | // This returns the current length of the queues (work items and new items) | |
583 | std::int64_t get_queue_length() const | |
584 | { | |
585 | return work_items_count_ + new_tasks_count_; | |
586 | } | |
587 | ||
588 | // This returns the current length of the pending queue | |
589 | std::int64_t get_pending_queue_length() const | |
590 | { | |
591 | return work_items_count_; | |
592 | } | |
593 | ||
594 | // This returns the current length of the staged queue | |
595 | std::int64_t get_staged_queue_length( | |
596 | boost::memory_order order = boost::memory_order_seq_cst) const | |
597 | { | |
598 | return new_tasks_count_.load(order); | |
599 | } | |
600 | ||
601 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
602 | std::uint64_t get_average_task_wait_time() const | |
603 | { | |
604 | std::uint64_t count = new_tasks_wait_count_; | |
605 | if (count == 0) | |
606 | return 0; | |
607 | return new_tasks_wait_ / count; | |
608 | } | |
609 | ||
610 | std::uint64_t get_average_thread_wait_time() const | |
611 | { | |
612 | std::uint64_t count = work_items_wait_count_; | |
613 | if (count == 0) | |
614 | return 0; | |
615 | return work_items_wait_ / count; | |
616 | } | |
617 | #endif | |
618 | ||
619 | #ifdef HPX_HAVE_THREAD_STEALING_COUNTS | |
620 | std::int64_t get_num_pending_misses(bool reset) | |
621 | { | |
622 | return util::get_and_reset_value(pending_misses_, reset); | |
623 | } | |
624 | ||
625 | void increment_num_pending_misses(std::size_t num = 1) | |
626 | { | |
627 | pending_misses_ += num; | |
628 | } | |
629 | ||
630 | std::int64_t get_num_pending_accesses(bool reset) | |
631 | { | |
632 | return util::get_and_reset_value(pending_accesses_, reset); | |
633 | } | |
634 | ||
635 | void increment_num_pending_accesses(std::size_t num = 1) | |
636 | { | |
637 | pending_accesses_ += num; | |
638 | } | |
639 | ||
640 | std::int64_t get_num_stolen_from_pending(bool reset) | |
641 | { | |
642 | return util::get_and_reset_value(stolen_from_pending_, reset); | |
643 | } | |
644 | ||
645 | void increment_num_stolen_from_pending(std::size_t num = 1) | |
646 | { | |
647 | stolen_from_pending_ += num; | |
648 | } | |
649 | ||
650 | std::int64_t get_num_stolen_from_staged(bool reset) | |
651 | { | |
652 | return util::get_and_reset_value(stolen_from_staged_, reset); | |
653 | } | |
654 | ||
655 | void increment_num_stolen_from_staged(std::size_t num = 1) | |
656 | { | |
657 | stolen_from_staged_ += num; | |
658 | } | |
659 | ||
660 | std::int64_t get_num_stolen_to_pending(bool reset) | |
661 | { | |
662 | return util::get_and_reset_value(stolen_to_pending_, reset); | |
663 | } | |
664 | ||
665 | void increment_num_stolen_to_pending(std::size_t num = 1) | |
666 | { | |
667 | stolen_to_pending_ += num; | |
668 | } | |
669 | ||
670 | std::int64_t get_num_stolen_to_staged(bool reset) | |
671 | { | |
672 | return util::get_and_reset_value(stolen_to_staged_, reset); | |
673 | } | |
674 | ||
675 | void increment_num_stolen_to_staged(std::size_t num = 1) | |
676 | { | |
677 | stolen_to_staged_ += num; | |
678 | } | |
679 | #else | |
680 | void increment_num_pending_misses(std::size_t num = 1) {} | |
681 | void increment_num_pending_accesses(std::size_t num = 1) {} | |
682 | void increment_num_stolen_from_pending(std::size_t num = 1) {} | |
683 | void increment_num_stolen_from_staged(std::size_t num = 1) {} | |
684 | void increment_num_stolen_to_pending(std::size_t num = 1) {} | |
685 | void increment_num_stolen_to_staged(std::size_t num = 1) {} | |
686 | #endif | |
687 | ||
688 | /////////////////////////////////////////////////////////////////////// | |
689 | // create a new thread and schedule it if the initial state is equal to | |
690 | // pending | |
691 | void create_thread(thread_init_data& data, thread_id_type* id, | |
692 | thread_state_enum initial_state, bool run_now, error_code& ec) | |
693 | { | |
694 | // thread has not been created yet | |
695 | if (id) *id = invalid_thread_id; | |
696 | ||
697 | if (run_now) | |
698 | { | |
699 | threads::thread_id_type thrd; | |
700 | ||
701 | // The mutex must not be held while the new thread object is being | |
702 | // created, as the current HPX thread might get suspended during the | |
703 | // creation. | |
704 | { | |
705 | std::unique_lock<mutex_type> lk(mtx_); | |
706 | ||
707 | create_thread_object(thrd, data, initial_state, lk); | |
708 | ||
709 | // add a new entry in the map for this thread | |
710 | std::pair<thread_map_type::iterator, bool> p = | |
711 | thread_map_.insert(thrd); | |
712 | ||
713 | if (HPX_UNLIKELY(!p.second)) { | |
714 | HPX_THROWS_IF(ec, hpx::out_of_memory, | |
715 | "threadmanager::register_thread", | |
716 | "Couldn't add new thread to the map of threads"); | |
717 | return; | |
718 | } | |
719 | ++thread_map_count_; | |
720 | ||
721 | // this thread has to be in the map now | |
722 | HPX_ASSERT(thread_map_.find(thrd.get()) != thread_map_.end()); | |
723 | HPX_ASSERT(thrd->get_pool() == &memory_pool_); | |
724 | ||
725 | // push the new thread in the pending queue thread | |
726 | if (initial_state == pending) | |
727 | schedule_thread(thrd.get()); | |
728 | ||
729 | // return the thread_id of the newly created thread | |
730 | if (id) *id = std::move(thrd); | |
731 | ||
732 | if (&ec != &throws) | |
733 | ec = make_success_code(); | |
734 | return; | |
735 | } | |
736 | } | |
737 | ||
738 | // do not execute the work, but register a task description for | |
739 | // later thread creation | |
740 | ++new_tasks_count_; | |
741 | ||
742 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
743 | new_tasks_.push(new task_description( | |
744 | std::move(data), initial_state, | |
745 | util::high_resolution_clock::now() | |
746 | )); | |
747 | #else | |
748 | new_tasks_.push(new task_description( //-V106 | |
749 | std::move(data), initial_state)); | |
750 | #endif | |
751 | if (&ec != &throws) | |
752 | ec = make_success_code(); | |
753 | } | |
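| // Typical use (illustrative sketch; how thread_init_data is filled in and the | |
| // surrounding scheduler object are assumptions, not prescribed by this file): | |
| // | |
| //     threads::thread_init_data data(/*...*/);    // thread function, description, ... | |
| //     threads::thread_id_type id; | |
| //     error_code ec; | |
| //     queue.create_thread(data, &id, pending, /*run_now=*/true, ec); | |
| // | |
| // With run_now == false the request is merely staged in new_tasks_; the actual | |
| // thread object is created later by add_new() via wait_or_add_new(). | |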
754 | ||
755 | void move_work_items_from(thread_queue *src, std::int64_t count) | |
756 | { | |
757 | thread_description* trd; | |
758 | while (src->work_items_.pop(trd)) | |
759 | { | |
760 | --src->work_items_count_; | |
761 | ||
762 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
763 | if (maintain_queue_wait_times) { | |
764 | std::uint64_t now = util::high_resolution_clock::now(); | |
765 | src->work_items_wait_ += now - util::get<1>(*trd); | |
766 | ++src->work_items_wait_count_; | |
767 | util::get<1>(*trd) = now; | |
768 | } | |
769 | #endif | |
770 | ||
771 | bool finished = count == ++work_items_count_; | |
772 | work_items_.push(trd); | |
773 | if (finished) | |
774 | break; | |
775 | } | |
776 | } | |
777 | ||
778 | void move_task_items_from(thread_queue *src, | |
779 | std::int64_t count) | |
780 | { | |
781 | task_description* task; | |
782 | while (src->new_tasks_.pop(task)) | |
783 | { | |
784 | --src->new_tasks_count_; | |
785 | ||
786 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
787 | if (maintain_queue_wait_times) { | |
788 | std::int64_t now = util::high_resolution_clock::now(); | |
789 | src->new_tasks_wait_ += now - util::get<2>(*task); | |
790 | ++src->new_tasks_wait_count_; | |
791 | util::get<2>(*task) = now; | |
792 | } | |
793 | #endif | |
794 | ||
795 | bool finish = count == ++new_tasks_count_; | |
796 | if (new_tasks_.push(task)) | |
797 | { | |
798 | if (finish) | |
799 | break; | |
800 | } | |
801 | else | |
802 | { | |
803 | --new_tasks_count_; | |
804 | } | |
805 | } | |
806 | } | |
807 | ||
808 | /// Return the next thread to be executed; return false if none is | |
809 | /// available | |
810 | bool get_next_thread(threads::thread_data*& thrd, | |
811 | bool steal = false) HPX_HOT | |
812 | { | |
813 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
814 | thread_description* tdesc; | |
815 | if (0 != work_items_count_.load(boost::memory_order_relaxed) && | |
816 | work_items_.pop(tdesc, steal)) | |
817 | { | |
818 | --work_items_count_; | |
819 | ||
820 | if (maintain_queue_wait_times) { | |
821 | work_items_wait_ += util::high_resolution_clock::now() - | |
822 | util::get<1>(*tdesc); | |
823 | ++work_items_wait_count_; | |
824 | } | |
825 | ||
826 | thrd = util::get<0>(*tdesc); | |
827 | delete tdesc; | |
828 | ||
829 | return true; | |
830 | } | |
831 | #else | |
832 | if (0 != work_items_count_.load(boost::memory_order_relaxed) && | |
833 | work_items_.pop(thrd, steal)) | |
834 | { | |
835 | --work_items_count_; | |
836 | return true; | |
837 | } | |
838 | #endif | |
839 | return false; | |
840 | } | |
841 | ||
842 | /// Schedule the passed thread | |
843 | void schedule_thread(threads::thread_data* thrd, bool other_end = false) | |
844 | { | |
845 | ++work_items_count_; | |
846 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
847 | work_items_.push(new thread_description( | |
848 | thrd, util::high_resolution_clock::now()), other_end); | |
849 | #else | |
850 | work_items_.push(thrd, other_end); | |
851 | #endif | |
852 | } | |
853 | ||
854 | /// Destroy the passed thread as it has been terminated | |
855 | bool destroy_thread(threads::thread_data* thrd, std::int64_t& busy_count) | |
856 | { | |
857 | if (thrd->get_pool() == &memory_pool_) | |
858 | { | |
859 | terminated_items_.push(thrd); | |
860 | ||
861 | std::int64_t count = ++terminated_items_count_; | |
862 | if (count > HPX_MAX_TERMINATED_THREADS) | |
863 | { | |
864 | cleanup_terminated(true); // clean up all terminated threads | |
865 | } | |
866 | return true; | |
867 | } | |
868 | return false; | |
869 | } | |
870 | ||
871 | /////////////////////////////////////////////////////////////////////// | |
872 | /// Return the number of existing threads with the given state. | |
873 | std::int64_t get_thread_count(thread_state_enum state = unknown) const | |
874 | { | |
875 | if (terminated == state) | |
876 | return terminated_items_count_; | |
877 | ||
878 | if (staged == state) | |
879 | return new_tasks_count_; | |
880 | ||
881 | if (unknown == state) | |
882 | return thread_map_count_ + new_tasks_count_ - terminated_items_count_; | |
883 | ||
884 | // acquire lock only if absolutely necessary | |
885 | std::lock_guard<mutex_type> lk(mtx_); | |
886 | ||
887 | std::int64_t num_threads = 0; | |
888 | thread_map_type::const_iterator end = thread_map_.end(); | |
889 | for (thread_map_type::const_iterator it = thread_map_.begin(); | |
890 | it != end; ++it) | |
891 | { | |
892 | if ((*it)->get_state().state() == state) | |
893 | ++num_threads; | |
894 | } | |
895 | return num_threads; | |
896 | } | |
897 | ||
898 | /////////////////////////////////////////////////////////////////////// | |
899 | void abort_all_suspended_threads() | |
900 | { | |
901 | std::lock_guard<mutex_type> lk(mtx_); | |
902 | thread_map_type::iterator end = thread_map_.end(); | |
903 | for (thread_map_type::iterator it = thread_map_.begin(); | |
904 | it != end; ++it) | |
905 | { | |
906 | if ((*it)->get_state().state() == suspended) | |
907 | { | |
908 | (*it)->set_state(pending, wait_abort); | |
909 | schedule_thread((*it).get()); | |
910 | } | |
911 | } | |
912 | } | |
913 | ||
914 | bool enumerate_threads( | |
915 | util::function_nonser<bool(thread_id_type)> const& f, | |
916 | thread_state_enum state = unknown) const | |
917 | { | |
918 | std::uint64_t count = thread_map_count_; | |
919 | if (state == terminated) | |
920 | { | |
921 | count = terminated_items_count_; | |
922 | } | |
923 | else if (state == staged) | |
924 | { | |
925 | HPX_THROW_EXCEPTION(bad_parameter, | |
926 | "thread_queue::iterate_threads", | |
927 | "can't iterate over thread ids of staged threads"); | |
928 | return false; | |
929 | } | |
930 | ||
931 | std::vector<thread_id_type> ids; | |
932 | ids.reserve(count); | |
933 | ||
934 | if (state == unknown) | |
935 | { | |
936 | std::lock_guard<mutex_type> lk(mtx_); | |
937 | thread_map_type::const_iterator end = thread_map_.end(); | |
938 | for (thread_map_type::const_iterator it = thread_map_.begin(); | |
939 | it != end; ++it) | |
940 | { | |
941 | ids.push_back(*it); | |
942 | } | |
943 | } | |
944 | else | |
945 | { | |
946 | std::lock_guard<mutex_type> lk(mtx_); | |
947 | thread_map_type::const_iterator end = thread_map_.end(); | |
948 | for (thread_map_type::const_iterator it = thread_map_.begin(); | |
949 | it != end; ++it) | |
950 | { | |
951 | if ((*it)->get_state().state() == state) | |
952 | ids.push_back(*it); | |
953 | } | |
954 | } | |
955 | ||
956 | // now invoke callback function for all matching threads | |
957 | for (thread_id_type const& id : ids) | |
958 | { | |
959 | if (!f(id)) | |
960 | return false; // stop iteration | |
961 | } | |
962 | ||
963 | return true; | |
964 | } | |
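| // Example (illustrative): counting all currently suspended threads. The lambda | |
| // returns true to continue the enumeration and false to stop it early. | |
| // | |
| //     std::int64_t n = 0; | |
| //     queue.enumerate_threads( | |
| //         [&n](threads::thread_id_type const&) -> bool { ++n; return true; }, | |
| //         suspended); | |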
965 | ||
966 | /// This is a function which gets called periodically by the thread | |
967 | /// manager to allow for maintenance tasks to be executed in the | |
968 | /// scheduler. Returns true if the OS thread calling this function | |
969 | /// has to be terminated (i.e. no more work has to be done). | |
970 | inline bool wait_or_add_new(bool running, | |
971 | std::int64_t& idle_loop_count, std::size_t& added, | |
972 | thread_queue* addfrom_ = nullptr, bool steal = false) HPX_HOT | |
973 | { | |
974 | // try to generate new threads from task lists, but only if our | |
975 | // own list of threads is empty | |
976 | if (0 == work_items_count_.load(boost::memory_order_relaxed)) { | |
977 | ||
978 | // No obvious work has to be done, so a lock won't hurt too much. | |
979 | // | |
980 | // We prefer to exit this function (some kind of very short | |
981 | // busy waiting) over blocking on this lock. Locking fails either | |
982 | // because another thread is currently doing thread maintenance (which | |
983 | // means there might be new work), or because the thread owning the | |
984 | // lock is just falling through to the cleanup work below (no work | |
985 | // is available), in which case the current thread (which failed to | |
986 | // acquire the lock) will simply retry to enter this loop. | |
987 | std::unique_lock<mutex_type> lk(mtx_, std::try_to_lock); | |
988 | if (!lk.owns_lock()) | |
989 | return false; // avoid long wait on lock | |
990 | ||
991 | // stop running after all HPX threads have been terminated | |
992 | thread_queue* addfrom = addfrom_ ? addfrom_ : this; | |
993 | bool added_new = add_new_always(added, addfrom, lk, steal); | |
994 | if (!added_new) { | |
995 | // Before exiting each of the OS threads deletes the | |
996 | // remaining terminated HPX threads | |
997 | // REVIEW: Should we be doing this if we are stealing? | |
998 | bool canexit = cleanup_terminated_locked(true); | |
999 | if (!running && canexit) { | |
1000 | // we don't have any registered work items anymore | |
1001 | //do_some_work(); // notify possibly waiting threads | |
1002 | return true; // terminate scheduling loop | |
1003 | } | |
1004 | return false; | |
1005 | } | |
1006 | ||
1007 | cleanup_terminated_locked(); | |
1008 | } | |
1009 | return false; | |
1010 | } | |
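| // Rough sketch of the intended calling pattern (the actual scheduling loop | |
| // lives in the schedulers/thread manager, not in this header; queue, | |
| // scheduler_is_active, running, idle_loop_count and added are placeholders): | |
| // | |
| //     threads::thread_data* thrd = nullptr; | |
| //     while (scheduler_is_active) { | |
| //         if (queue.get_next_thread(thrd)) { | |
| //             // ... execute thrd; re-schedule it via schedule_thread() if it | |
| //             // becomes pending again, or hand it to destroy_thread() once it | |
| //             // has terminated ... | |
| //         } | |
| //         else if (queue.wait_or_add_new(running, idle_loop_count, added)) { | |
| //             break;    // no work left and not running any more: exit the loop | |
| //         } | |
| //     } | |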
1011 | ||
1012 | /////////////////////////////////////////////////////////////////////// | |
1013 | bool dump_suspended_threads(std::size_t num_thread | |
1014 | , std::int64_t& idle_loop_count, bool running) | |
1015 | { | |
1016 | #ifndef HPX_HAVE_THREAD_MINIMAL_DEADLOCK_DETECTION | |
1017 | return false; | |
1018 | #else | |
1019 | if (minimal_deadlock_detection) { | |
1020 | std::lock_guard<mutex_type> lk(mtx_); | |
1021 | return detail::dump_suspended_threads(num_thread, thread_map_ | |
1022 | , idle_loop_count, running); | |
1023 | } | |
1024 | return false; | |
1025 | #endif | |
1026 | } | |
1027 | ||
1028 | /////////////////////////////////////////////////////////////////////// | |
1029 | void on_start_thread(std::size_t num_thread) {} | |
1030 | void on_stop_thread(std::size_t num_thread) {} | |
1031 | void on_error(std::size_t num_thread, boost::exception_ptr const& e) {} | |
1032 | ||
1033 | private: | |
1034 | mutable mutex_type mtx_; ///< mutex protecting the members | |
1035 | ||
1036 | thread_map_type thread_map_; | |
1037 | ///< set of all thread ids known to this queue | |
1038 | boost::atomic<std::int64_t> thread_map_count_; | |
1039 | ///< overall count of threads in the map | |
1040 | ||
1041 | work_items_type work_items_; | |
1042 | ///< list of active work items | |
1043 | boost::atomic<std::int64_t> work_items_count_; | |
1044 | ///< count of active work items | |
1045 | ||
1046 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
1047 | boost::atomic<std::int64_t> work_items_wait_; | |
1048 | ///< overall wait time of work items | |
1049 | boost::atomic<std::int64_t> work_items_wait_count_; | |
1050 | ///< overall number of work items that waited | |
1051 | #endif | |
1052 | terminated_items_type terminated_items_; ///< list of terminated threads | |
1053 | boost::atomic<std::int64_t> terminated_items_count_; | |
1054 | ///< count of terminated items | |
1055 | ||
1056 | std::size_t max_count_; | |
1057 | ///< maximum number of existing HPX-threads | |
1058 | task_items_type new_tasks_; | |
1059 | ///< list of new tasks to run | |
1060 | ||
1061 | boost::atomic<std::int64_t> new_tasks_count_; | |
1062 | ///< count of new tasks to run | |
1063 | #ifdef HPX_HAVE_THREAD_QUEUE_WAITTIME | |
1064 | boost::atomic<std::int64_t> new_tasks_wait_; | |
1065 | ///< overall wait time of new tasks | |
1066 | boost::atomic<std::int64_t> new_tasks_wait_count_; | |
1067 | ///< overall number of tasks that waited | |
1068 | #endif | |
1069 | ||
1070 | threads::thread_pool memory_pool_; ///< OS thread local memory pools for | |
1071 | ///< HPX-threads | |
1072 | ||
1073 | std::list<thread_id_type> thread_heap_small_; | |
1074 | std::list<thread_id_type> thread_heap_medium_; | |
1075 | std::list<thread_id_type> thread_heap_large_; | |
1076 | std::list<thread_id_type> thread_heap_huge_; | |
1077 | ||
1078 | #ifdef HPX_HAVE_THREAD_CREATION_AND_CLEANUP_RATES | |
1079 | std::uint64_t add_new_time_; | |
1080 | std::uint64_t cleanup_terminated_time_; | |
1081 | #endif | |
1082 | ||
1083 | #ifdef HPX_HAVE_THREAD_STEALING_COUNTS | |
1084 | // # of times our associated worker-thread couldn't find work in work_items | |
1085 | boost::atomic<std::int64_t> pending_misses_; | |
1086 | ||
1087 | // # of times our associated worker-thread looked for work in work_items | |
1088 | boost::atomic<std::int64_t> pending_accesses_; | |
1089 | ||
1090 | boost::atomic<std::int64_t> stolen_from_pending_; | |
1091 | ///< count of work_items stolen from this queue | |
1092 | boost::atomic<std::int64_t> stolen_from_staged_; | |
1093 | ///< count of new_tasks stolen from this queue | |
1094 | boost::atomic<std::int64_t> stolen_to_pending_; | |
1095 | ///< count of work_items stolen to this queue from other queues | |
1096 | boost::atomic<std::int64_t> stolen_to_staged_; | |
1097 | ///< count of new_tasks stolen to this queue from other queues | |
1098 | #endif | |
1099 | ||
1100 | util::block_profiler<add_new_tag> add_new_logger_; | |
1101 | }; | |
1102 | }}} | |
1103 | ||
1104 | #endif | |
1105 | ||
1106 ||