job/queue: rework locking for reliability

This commit is contained in:
Danny Robson 2018-03-15 15:21:05 +11:00
parent 0c824919de
commit f3f3666877
3 changed files with 189 additions and 115 deletions

View File

@ -11,11 +11,13 @@
* See the License for the specific language governing permissions and
* limitations under the License.
*
* Copyright 2017 Danny Robson <danny@nerdcruft.net>
* Copyright 2018 Danny Robson <danny@nerdcruft.net>
*/
#include "./queue.hpp"
#include "../raii.hpp"
#include <iostream>
using util::job::queue;
@ -29,56 +31,57 @@ queue::queue ():
//-----------------------------------------------------------------------------
queue::queue (unsigned thread_count):
m_loop ([] (store &s) {
args obj;
while (true) {
// acquire the work lock and see if we need to quit, continue,
// or sleep
std::unique_lock<std::mutex> lk (s.mutex);
if (s.pending.empty ()) {
s.cv.wait (lk, [&] () {
return s.stopping.load () || !s.pending.empty ();
});
}
if (s.stopping.load ())
break;
// extract the arguments and forward them to the functor
obj = std::move (s.pending.front ());
s.pending.pop_front ();
lk.unlock ();
s.cv.notify_one ();
obj.function (obj);
}
}),
m_tasks {
{}, util::pool<task> {4096}
},
m_pending (0),
m_threads (thread_count)
{
for (auto &t: m_threads)
t = std::thread (m_loop, std::ref (m_store));
t = std::thread (&queue::loop, this);
}
//-----------------------------------------------------------------------------
queue::~queue ()
{
// tell everyone we want to quit
{
std::lock_guard<std::mutex> lk {m_store.mutex};
m_store.stopping.store (true);
}
m_store.cv.notify_all ();
m_stopping = true;
// raise the semaphore enough times to resume all the worker threads
for (size_t i = 0; i < m_threads.size (); ++i)
m_pending.release ();
// wait for everyone to tidy up. perhaps we'd like to use a timeout, but
// if things deadlock then it's the users fault currently.
std::for_each (
std::begin (m_threads),
std::end (m_threads),
[] (auto &t)
{
for (auto &t: m_threads)
t.join ();
});
}
///////////////////////////////////////////////////////////////////////////////
void
queue::loop ()
{
while (true) {
m_pending.acquire ();
if (m_stopping)
return;
util::scoped_counter running_count (m_running);
CHECK (!m_tasks.pending->empty ());
auto todo = [this] () {
auto obj = m_tasks.pending.acquire ();
auto res = obj->front ();
obj->pop_front ();
return res;
} ();
util::scoped_function cleanup ([&, this] () {
m_tasks.store.destroy (todo);
});
todo->function (*todo);
}
}

View File

@ -17,6 +17,15 @@
#ifndef CRUFT_UTIL_JOB_QUEUE_HPP
#define CRUFT_UTIL_JOB_QUEUE_HPP
#include "../pool.hpp"
#include "../tuple.hpp"
#include "ticketlock.hpp"
#include "semaphore.hpp"
#include "flag.hpp"
#include "monitor.hpp"
#include <array>
#include <deque>
#include <thread>
@ -28,6 +37,8 @@
#include <mutex>
#include <condition_variable>
#include <iostream>
namespace util::job {
class queue {
public:
@ -35,66 +46,83 @@ namespace util::job {
explicit queue (unsigned thread_count);
~queue ();
using cookie = int;
queue (const queue&) = delete;
queue (queue&&) = delete;
queue& operator= (const queue&) = delete;
queue& operator= (queue&&) = delete;
auto parallelism (void) const { return m_threads.size (); }
struct task;
struct [[nodiscard]] cookie {
~cookie ()
{
if (data) {
data->done.wait ();
data->references.release ();
}
}
task&
operator-> (void)
{
return *data;
}
cookie (task &_data, queue &_runner):
data (&_data),
runner (_runner)
{ ; }
cookie (cookie &&rhs):
data (nullptr),
runner (rhs.runner)
{
std::swap (data, rhs.data);
}
cookie& operator= (cookie&&) = delete;
cookie (const cookie&) = delete;
cookie& operator= (const cookie&) = delete;
task *data;
queue &runner;
};
template <class Function, typename ...Args>
cookie
submit (cookie &parent, Function&&, Args&&...);
submit (task &parent, Function&&, Args&&...);
/// record a functor and a set of parameters to execute at some point
/// in the future by an arbitrary available thread.
template <class Function, typename ...Args>
cookie
submit (Function &&func, Args &&...params)
submit (Function &&func, Args &&...args)
{
{
std::unique_lock<std::mutex> lk (m_store.mutex);
m_store.pending.emplace_back (
std::forward<Function> (func),
std::forward<Args> (params)...
);
}
CHECK (!m_stopping);
m_store.cv.notify_one ();
auto ptr = m_tasks.store.construct (
std::forward<Function> (func),
std::forward<Args> (args)...
);
// TODO: return a useful identifier to allow waiting
return 0;
}
m_tasks.pending->push_back (ptr);
void wait (cookie);
m_pending.release ();
// HACK: this doesn't actually implement a proper barrier and may not
// even guarantee that all jobs are flushed. it's provided to make
// some amount of testing slightly more convenient by draining most
// of the queue on demand.
void
flush (void)
{
// setup a cv and completion flag. this is a poor man's barrier.
std::mutex m;
std::unique_lock<std::mutex> lk (m);
std::condition_variable cv;
std::atomic<bool> done = false;
// submit a job to the back of the queue that sets the done flag
// and wakes us back up again.
submit ([&] (void) {
{
std::lock_guard<std::mutex> _{m};
done.store (true);
}
cv.notify_one ();
});
// wait until the flag is set then exit.
do {
cv.wait (lk, [&] () { return done.load (); });
} while (!done.load ());
return cookie (*ptr, *this);
}
private:
// block until all jobs currently queued have been started
void flush (void);
// block until there are no more jobs queued or executing
void finish (void);
/// stores a functor and associated arguments in a fixed size buffer
/// for later execution.
///
@ -107,46 +135,77 @@ namespace util::job {
/// the user supplied functor is wrapped with our own that unpacks and
/// forwards the arguments from the data buffer. this function must
/// be passed a copy of the current arg object as the only argument.
struct args {
args () = default;
struct task {
task () = default;
template <class Function, typename ...Args>
args (Function &&func, Args&&...params)
~task ()
{
using tuple_t = std::tuple<std::decay_t<Args>...>;
static_assert ((std::is_trivial_v<std::decay_t<decltype(params)>> && ...));
done.notify ();
references.acquire ();
}
task (const task&) = delete;
task (task&&) = delete;
task& operator= (const task&) = delete;
task& operator= (task&&) = delete;
template <class FunctionT, typename ...Args>
task (FunctionT &&func, Args&&...params)
{
using tuple_t = std::tuple<std::remove_reference_t <Args>...>;
static_assert ((
(
std::is_trivially_copyable_v<Args> ||
std::is_scalar_v<std::remove_reference_t<Args>> ||
is_same_template_template_v<std::reference_wrapper, Args>
) && ...)
);
static_assert (sizeof (tuple_t) <= sizeof data);
union {
decltype(data) *byte_ptr;
tuple_t *args_ptr;
};
byte_ptr = &data;
*args_ptr = std::make_tuple (params...);
tuple_t &punned = *reinterpret_cast<tuple_t*> (&data);
punned = tuple_t (params...);
function = [func] (args &base) {
std::apply (func, *reinterpret_cast<tuple_t*> (&base.data));
};
};
if constexpr (std::is_function_v<std::remove_reference_t<FunctionT>>) {
function = [f=std::ref(func)] (task &base) {
std::apply (f, *reinterpret_cast<tuple_t*> (&base.data));
};
} else {
function = [func] (task &base) {
std::apply (func, *reinterpret_cast<tuple_t*> (&base.data));
};
}
}
void acquire (void) { --references; }
void release (void) { ++references; }
// GCC: switch to hardware_destructive_interference_size when it
// becomes available in libstdc++. Until then we use a sensible
// guess.
std::array<char,64> data;
std::function<void(args&)> function;
std::function<void(task&)> function;
semaphore references = 0;
flag done;
};
struct store {
std::atomic<bool> stopping = false;
std::deque<args> pending;
private:
void loop ();
std::condition_variable cv;
std::mutex mutex;
};
std::atomic<bool> m_stopping = false;
std::atomic<int> m_running = 0;
struct {
monitor<
std::deque<task*>,
ticketlock
> pending;
pool<task> store;
} m_tasks;
semaphore m_pending;
store m_store;
std::function<void(store&)> m_loop;
std::vector<std::thread> m_threads;
};
}

View File

@ -1,8 +1,12 @@
///////////////////////////////////////////////////////////////////////////////
#include "job/queue.hpp"
#include "tap.hpp"
#include <unistd.h>
#include <chrono>
#include <iostream>
///////////////////////////////////////////////////////////////////////////////
int
main (void)
{
@ -13,19 +17,27 @@ main (void)
// executed, and finished. it's not definitive, but executing this many
// items this many times seems reasonably reliable in exposing deadlocks.
bool success = true;
constexpr int OUTTER = 16;
constexpr int INNER = 1024;
constexpr int OUTTER = 1;
constexpr int INNER = 1;
for (auto i = 0; i < OUTTER && success; ++i) {
std::atomic<int> count = 0;
{
util::job::queue q {};
for (int j = 0; j < INNER; ++j)
q.submit ([&count] () noexcept { ++count; });
q.flush ();
util::job::queue q {1};
std::vector<util::job::queue::cookie> cookies;
for (int j = 0; j < INNER; ++j) {
cookies.push_back (
q.submit ([&count] (int sleep_for) noexcept {
std::this_thread::sleep_for (std::chrono::microseconds (sleep_for % 25));
++count;
}, j)
);
}
}
std::cout << count << '\n';
success = count == INNER && success;
}