[tor-commits] [tor/master] Documentation for new workqueue and condition and locking stuff
nickm at torproject.org
nickm at torproject.org
Wed Jan 21 19:50:31 UTC 2015
commit b2db3fb4627c8bd06489334f69b6d36d60fb418d
Author: Nick Mathewson <nickm at torproject.org>
Date: Wed Sep 25 11:05:27 2013 -0400
Documentation for new workqueue and condition and locking stuff
---
src/common/compat_pthreads.c | 11 ++-
src/common/compat_threads.c | 39 ++++++++-
src/common/compat_threads.h | 12 ++-
src/common/workqueue.c | 178 +++++++++++++++++++++++++++++++++---------
src/common/workqueue.h | 14 +++-
5 files changed, 205 insertions(+), 49 deletions(-)
diff --git a/src/common/compat_pthreads.c b/src/common/compat_pthreads.c
index 59b54a6..a2e4065 100644
--- a/src/common/compat_pthreads.c
+++ b/src/common/compat_pthreads.c
@@ -164,6 +164,7 @@ tor_get_thread_id(void)
/* Conditions. */
+/** Initialize an already-allocated condition variable. */
int
tor_cond_init(tor_cond_t *cond)
{
@@ -173,7 +174,9 @@ tor_cond_init(tor_cond_t *cond)
}
return 0;
}
-/** Release all resources held by <b>cond</b>. */
+
+/** Release all resources held by <b>cond</b>, but do not free <b>cond</b>
+ * itself. */
void
tor_cond_uninit(tor_cond_t *cond)
{
@@ -183,7 +186,11 @@ tor_cond_uninit(tor_cond_t *cond)
}
}
/** Wait until one of the tor_cond_signal functions is called on <b>cond</b>.
- * All waiters on the condition must wait holding the same <b>mutex</b>.
+ * (If <b>tv</b> is set, and that amount of time passes with no signal to
+ * <b>cond</b>, return anyway. All waiters on the condition must wait holding
+ * the same <b>mutex</b>. All signallers should hold that mutex. The mutex
+ * needs to have been allocated with tor_mutex_init_for_cond().
+ *
* Returns 0 on success, -1 on failure, 1 on timeout. */
int
tor_cond_wait(tor_cond_t *cond, tor_mutex_t *mutex, const struct timeval *tv)
diff --git a/src/common/compat_threads.c b/src/common/compat_threads.c
index 98bdbbc..024c627 100644
--- a/src/common/compat_threads.c
+++ b/src/common/compat_threads.c
@@ -40,6 +40,7 @@ tor_mutex_free(tor_mutex_t *m)
tor_free(m);
}
+/** Allocate and return a new condition variable. */
tor_cond_t *
tor_cond_new(void)
{
@@ -48,6 +49,8 @@ tor_cond_new(void)
tor_free(cond);
return cond;
}
+
+/** Free all storage held in <b>c</b>. */
void
tor_cond_free(tor_cond_t *c)
{
@@ -140,13 +143,16 @@ sock_drain(tor_socket_t fd)
return 0;
}
-/** Allocate a new set of alert sockets. DOCDOC */
+/** Allocate a new set of alert sockets, and set the appropriate function
+ * pointers, in <b>socks_out</b>. */
int
alert_sockets_create(alert_sockets_t *socks_out)
{
tor_socket_t socks[2];
#ifdef HAVE_EVENTFD
+ /* First, we try the Linux eventfd() syscall. This gives a 64-bit counter
+ * associated with a single file descriptor. */
#if defined(EFD_CLOEXEC) && defined(EFD_NONBLOCK)
socks[0] = eventfd(0, EFD_CLOEXEC|EFD_NONBLOCK);
#else
@@ -171,6 +177,8 @@ alert_sockets_create(alert_sockets_t *socks_out)
#endif
#ifdef HAVE_PIPE2
+ /* Now we're going to try pipes. First type the pipe2() syscall, if we
+ * have it, so we can save some calls... */
if (pipe2(socks, O_NONBLOCK|O_CLOEXEC) == 0) {
socks_out->read_fd = socks[0];
socks_out->write_fd = socks[1];
@@ -181,6 +189,8 @@ alert_sockets_create(alert_sockets_t *socks_out)
#endif
#ifdef HAVE_PIPE
+ /* Now try the regular pipe() syscall. Pipes have a bit lower overhead than
+ * socketpairs, fwict. */
if (pipe(socks) == 0) {
if (fcntl(socks[0], F_SETFD, FD_CLOEXEC) < 0 ||
fcntl(socks[1], F_SETFD, FD_CLOEXEC) < 0 ||
@@ -198,12 +208,35 @@ alert_sockets_create(alert_sockets_t *socks_out)
}
#endif
+ /* If nothing else worked, fall back on socketpair(). */
if (tor_socketpair(AF_UNIX, SOCK_STREAM, 0, socks) == 0) {
- set_socket_nonblocking(socks[0]);
- set_socket_nonblocking(socks[1]);
+ if (set_socket_nonblocking(socks[0]) < 0 ||
+ set_socket_nonblocking(socks[1])) {
+ tor_close_socket(socks[0]);
+ tor_close_socket(socks[1]);
+ return -1;
+ }
+ socks_out->read_fd = socks[0];
+ socks_out->write_fd = socks[1];
socks_out->alert_fn = sock_alert;
socks_out->drain_fn = sock_drain;
return 0;
}
return -1;
}
+
+/** Close the sockets in <b>socks</b>. */
+void
+alert_sockets_close(alert_sockets_t *socks)
+{
+ if (socks->alert_fn == sock_alert) {
+ /* they are sockets. */
+ tor_close_socket(socks->read_fd);
+ tor_close_socket(socks->write_fd);
+ } else {
+ close(socks->read_fd);
+ if (socks->write_fd != socks->read_fd)
+ close(socks->write_fd);
+ }
+ socks->read_fd = socks->write_fd = -1;
+}
diff --git a/src/common/compat_threads.h b/src/common/compat_threads.h
index b053136..9070f13 100644
--- a/src/common/compat_threads.h
+++ b/src/common/compat_threads.h
@@ -82,15 +82,23 @@ int tor_cond_wait(tor_cond_t *cond, tor_mutex_t *mutex,
void tor_cond_signal_one(tor_cond_t *cond);
void tor_cond_signal_all(tor_cond_t *cond);
-/** DOCDOC */
+/** Helper type used to manage waking up the main thread while it's in
+ * the libevent main loop. Used by the work queue code. */
typedef struct alert_sockets_s {
- /*XXX needs a better name */
+ /* XXXX This structure needs a better name. */
+ /** Socket that the main thread should listen for EV_READ events on.
+ * Note that this socket may be a regular fd on a non-Windows platform.
+ */
tor_socket_t read_fd;
+ /** Socket to use when alerting the main thread. */
tor_socket_t write_fd;
+ /** Function to alert the main thread */
int (*alert_fn)(tor_socket_t write_fd);
+ /** Function to make the main thread no longer alerted. */
int (*drain_fn)(tor_socket_t read_fd);
} alert_sockets_t;
int alert_sockets_create(alert_sockets_t *socks_out);
+void alert_sockets_close(alert_sockets_t *socks);
#endif
diff --git a/src/common/workqueue.c b/src/common/workqueue.c
index c4b64de..e07787b 100644
--- a/src/common/workqueue.c
+++ b/src/common/workqueue.c
@@ -9,67 +9,84 @@
#include "tor_queue.h"
#include "torlog.h"
-/*
- design:
-
- each thread has its own queue, try to keep at least elements min..max cycles
- worth of work on each queue.
-
-keep array of threads; round-robin between them.
-
- When out of work, work-steal.
-
- alert threads with condition variables.
+struct threadpool_s {
+ /** An array of pointers to workerthread_t: one for each running worker
+ * thread. */
+ struct workerthread_s **threads;
+ /** Index of the next thread that we'll give work to.*/
+ int next_for_work;
- alert main thread with fd, since it's libevent.
+ /** Number of elements in threads. */
+ int n_threads;
+ /** Mutex to protect all the above fields. */
+ tor_mutex_t lock;
+ /** A reply queue to use when constructing new threads. */
+ replyqueue_t *reply_queue;
- */
+ /** Functions used to allocate and free thread state. */
+ void *(*new_thread_state_fn)(void*);
+ void (*free_thread_state_fn)(void*);
+ void *new_thread_state_arg;
+};
struct workqueue_entry_s {
+ /** The next workqueue_entry_t that's pending on the same thread or
+ * reply queue. */
TOR_TAILQ_ENTRY(workqueue_entry_s) next_work;
+ /** The thread to which this workqueue_entry_t was assigned. This field
+ * is set when the workqueue_entry_t is created, and won't be cleared until
+ * after it's handled in the main thread. */
struct workerthread_s *on_thread;
+ /** True iff this entry is waiting for a worker to start processing it. */
uint8_t pending;
+ /** Function to run in the worker thread. */
int (*fn)(void *state, void *arg);
+ /** Function to run while processing the reply queue. */
void (*reply_fn)(void *arg);
+ /** Argument for the above functions. */
void *arg;
};
struct replyqueue_s {
+ /** Mutex to protect the answers field */
tor_mutex_t lock;
+ /** Doubly-linked list of answers that the reply queue needs to handle. */
TOR_TAILQ_HEAD(, workqueue_entry_s) answers;
- alert_sockets_t alert; // lock not held on this.
+ /** Mechanism to wake up the main thread when it is receiving answers. */
+ alert_sockets_t alert;
};
+/** A worker thread represents a single thread in a thread pool. To avoid
+ * contention, each gets its own queue. This breaks the guarantee that that
+ * queued work will get executed strictly in order. */
typedef struct workerthread_s {
+ /** Lock to protect all fields of this thread and its queue. */
tor_mutex_t lock;
+ /** Condition variable that we wait on when we have no work, and which
+ * gets signaled when our queue becomes nonempty. */
tor_cond_t condition;
+ /** Queue of pending work that we have to do. */
TOR_TAILQ_HEAD(, workqueue_entry_s) work;
+ /** True iff this thread is currently in its loop. */
unsigned is_running;
+ /** True iff this thread has crashed or is shut down for some reason. */
unsigned is_shut_down;
+ /** True if we're waiting for more elements to get added to the queue. */
unsigned waiting;
+ /** User-supplied state field that we pass to the worker functions of each
+ * work item. */
void *state;
+ /** Reply queue to which we pass our results. */
replyqueue_t *reply_queue;
} workerthread_t;
-struct threadpool_s {
- workerthread_t **threads;
- int next_for_work;
-
- tor_mutex_t lock;
- int n_threads;
-
- replyqueue_t *reply_queue;
-
- void *(*new_thread_state_fn)(void*);
- void (*free_thread_state_fn)(void*);
- void *new_thread_state_arg;
-
-};
-
static void queue_reply(replyqueue_t *queue, workqueue_entry_t *work);
+/** Allocate and return a new workqueue_entry_t, set up to run the function
+ * <b>fn</b> in the worker thread, and <b>reply_fn</b> in the main
+ * thread. See threadpool_queue_work() for full documentation. */
static workqueue_entry_t *
workqueue_entry_new(int (*fn)(void*, void*),
void (*reply_fn)(void*),
@@ -82,6 +99,10 @@ workqueue_entry_new(int (*fn)(void*, void*),
return ent;
}
+/**
+ * Release all storage held in <b>ent</b>. Call only when <b>ent</b> is not on
+ * any queue.
+ */
static void
workqueue_entry_free(workqueue_entry_t *ent)
{
@@ -90,6 +111,20 @@ workqueue_entry_free(workqueue_entry_t *ent)
tor_free(ent);
}
+/**
+ * Cancel a workqueue_entry_t that has been returned from
+ * threadpool_queue_work.
+ *
+ * You must not call this function on any work whose reply function has been
+ * executed in the main thread; that will cause undefined behavior (probably,
+ * a crash).
+ *
+ * If the work is cancelled, this function return 1. It is the caller's
+ * responsibility to free any storage in the work function's arguments.
+ *
+ * This function will have no effect if the worker thread has already executed
+ * or begun to execute the work item. In that case, it will return 0.
+ */
int
workqueue_entry_cancel(workqueue_entry_t *ent)
{
@@ -107,6 +142,9 @@ workqueue_entry_cancel(workqueue_entry_t *ent)
return cancelled;
}
+/**
+ * Main function for the worker thread.
+ */
static void
worker_thread_main(void *thread_)
{
@@ -115,23 +153,26 @@ worker_thread_main(void *thread_)
int result;
tor_mutex_acquire(&thread->lock);
-
thread->is_running = 1;
while (1) {
- /* lock held. */
+ /* lock must be held at this point. */
while (!TOR_TAILQ_EMPTY(&thread->work)) {
- /* lock held. */
+ /* lock must be held at this point. */
work = TOR_TAILQ_FIRST(&thread->work);
TOR_TAILQ_REMOVE(&thread->work, work, next_work);
work->pending = 0;
tor_mutex_release(&thread->lock);
+ /* We run the work function without holding the thread lock. This
+ * is the main thread's first opportunity to give us more work. */
result = work->fn(thread->state, work->arg);
+ /* Queue the reply for the main thread. */
queue_reply(thread->reply_queue, work);
tor_mutex_acquire(&thread->lock);
+ /* We may need to exit the thread. */
if (result >= WQ_RPL_ERROR) {
thread->is_running = 0;
thread->is_shut_down = 1;
@@ -139,19 +180,23 @@ worker_thread_main(void *thread_)
return;
}
}
- /* Lock held; no work in this thread's queue. */
+ /* At this point the lock is held, and there is no work in this thread's
+ * queue. */
/* TODO: Try work-stealing. */
-
/* TODO: support an idle-function */
+ /* Okay. Now, wait till somebody has work for us. */
thread->waiting = 1;
- if (tor_cond_wait(&thread->condition, &thread->lock, NULL) < 0)
- /* ERR */
+ if (tor_cond_wait(&thread->condition, &thread->lock, NULL) < 0) {
+ /* XXXX ERROR */
+ }
thread->waiting = 0;
}
}
+/** Put a reply on the reply queue. The reply must not currently be on
+ * any thread's work queue. */
static void
queue_reply(replyqueue_t *queue, workqueue_entry_t *work)
{
@@ -168,6 +213,8 @@ queue_reply(replyqueue_t *queue, workqueue_entry_t *work)
}
}
+/** Allocate and start a new worker thread to use state object <b>state</b>,
+ * and send responses to <b>replyqueue</b>. */
static workerthread_t *
workerthread_new(void *state, replyqueue_t *replyqueue)
{
@@ -186,6 +233,10 @@ workerthread_new(void *state, replyqueue_t *replyqueue)
return thr;
}
+/**
+ * Add an item of work to a single worker thread. See threadpool_queue_work(*)
+ * for arguments.
+ */
static workqueue_entry_t *
workerthread_queue_work(workerthread_t *worker,
int (*fn)(void *, void *),
@@ -206,6 +257,23 @@ workerthread_queue_work(workerthread_t *worker,
return ent;
}
+/**
+ * Queue an item of work for a thread in a thread pool. The function
+ * <b>fn</b> will be run in a worker thread, and will receive as arguments the
+ * thread's state object, and the provided object <b>arg</b>. It must return
+ * one of WQ_RPL_REPLY, WQ_RPL_ERROR, or WQ_RPL_SHUTDOWN.
+ *
+ * Regardless of its return value, the function <b>reply_fn</b> will later be
+ * run in the main thread when it invokes replyqueue_process(), and will
+ * receive as its argument the same <b>arg</b> object. It's the reply
+ * function's responsibility to free the work object.
+ *
+ * On success, return a workqueue_entry_t object that can be passed to
+ * workqueue_entry_cancel(). On failure, return NULL.
+ *
+ * Note that because each thread has its own work queue, work items may not
+ * be executed strictly in order.
+ */
workqueue_entry_t *
threadpool_queue_work(threadpool_t *pool,
int (*fn)(void *, void *),
@@ -215,6 +283,7 @@ threadpool_queue_work(threadpool_t *pool,
workerthread_t *worker;
tor_mutex_acquire(&pool->lock);
+ /* Pick the next thread in random-access order. */
worker = pool->threads[pool->next_for_work++];
if (!worker) {
tor_mutex_release(&pool->lock);
@@ -227,9 +296,19 @@ threadpool_queue_work(threadpool_t *pool,
return workerthread_queue_work(worker, fn, reply_fn, arg);
}
+/**
+ * Queue a copy of a work item for every thread in a pool. This can be used,
+ * for example, to tell the threads to update some parameter in their states.
+ *
+ * Arguments are as for <b>threadpool_queue_work</b>, except that the
+ * <b>arg</b> value is passed to <b>dup_fn</b> once per each thread to
+ * make a copy of it.
+ *
+ * Return 0 on success, -1 on failure.
+ */
int
threadpool_queue_for_all(threadpool_t *pool,
- void *(*dup_fn)(void *),
+ void *(*dup_fn)(const void *),
int (*fn)(void *, void *),
void (*reply_fn)(void *),
void *arg)
@@ -251,6 +330,7 @@ threadpool_queue_for_all(threadpool_t *pool,
}
}
+/** Launch threads until we have <b>n</b>. */
static int
threadpool_start_threads(threadpool_t *pool, int n)
{
@@ -274,6 +354,13 @@ threadpool_start_threads(threadpool_t *pool, int n)
return 0;
}
+/**
+ * Construct a new thread pool with <b>n</b> worker threads, configured to
+ * send their output to <b>replyqueue</b>. The threads' states will be
+ * constructed with the <b>new_thread_state_fn</b> call, receiving <b>arg</b>
+ * as its argument. When the threads close, they will call
+ * <b>free_thread_state_fn</b> on their states.
+ */
threadpool_t *
threadpool_new(int n_threads,
replyqueue_t *replyqueue,
@@ -298,12 +385,17 @@ threadpool_new(int n_threads,
return pool;
}
+/** Return the reply queue associated with a given thread pool. */
replyqueue_t *
threadpool_get_replyqueue(threadpool_t *tp)
{
return tp->reply_queue;
}
+/** Allocate a new reply queue. Reply queues are used to pass results from
+ * worker threads to the main thread. Since the main thread is running an
+ * IO-centric event loop, it needs to get woken up with means other than a
+ * condition variable. */
replyqueue_t *
replyqueue_new(void)
{
@@ -321,12 +413,22 @@ replyqueue_new(void)
return rq;
}
+/**
+ * Return the "read socket" for a given reply queue. The main thread should
+ * listen for read events on this socket, and call replyqueue_process() every
+ * time it triggers.
+ */
tor_socket_t
replyqueue_get_socket(replyqueue_t *rq)
{
return rq->alert.read_fd;
}
+/**
+ * Process all pending replies on a reply queue. The main thread should call
+ * this function every time the socket returned by replyqueue_get_socket() is
+ * readable.
+ */
void
replyqueue_process(replyqueue_t *queue)
{
@@ -336,7 +438,7 @@ replyqueue_process(replyqueue_t *queue)
tor_mutex_acquire(&queue->lock);
while (!TOR_TAILQ_EMPTY(&queue->answers)) {
- /* lock held. */
+ /* lock must be held at this point.*/
workqueue_entry_t *work = TOR_TAILQ_FIRST(&queue->answers);
TOR_TAILQ_REMOVE(&queue->answers, work, next_work);
tor_mutex_release(&queue->lock);
diff --git a/src/common/workqueue.h b/src/common/workqueue.h
index 684fb19..dca947e 100644
--- a/src/common/workqueue.h
+++ b/src/common/workqueue.h
@@ -6,15 +6,21 @@
#include "compat.h"
+/** A replyqueue is used to tell the main thread about the outcome of
+ * work that we queued for the the workers. */
typedef struct replyqueue_s replyqueue_t;
+/** A thread-pool manages starting threads and passing work to them. */
typedef struct threadpool_s threadpool_t;
+/** A workqueue entry represents a request that has been passed to a thread
+ * pool. */
typedef struct workqueue_entry_s workqueue_entry_t;
-#define WQ_CMD_RUN 0
-#define WQ_CMD_CANCEL 1
-
+/** Possible return value from a work function: indicates success. */
#define WQ_RPL_REPLY 0
+/** Possible return value from a work function: indicates fatal error */
#define WQ_RPL_ERROR 1
+/** Possible return value from a work function: indicates thread is shutting
+ * down. */
#define WQ_RPL_SHUTDOWN 2
workqueue_entry_t *threadpool_queue_work(threadpool_t *pool,
@@ -22,7 +28,7 @@ workqueue_entry_t *threadpool_queue_work(threadpool_t *pool,
void (*reply_fn)(void *),
void *arg);
int threadpool_queue_for_all(threadpool_t *pool,
- void *(*dup_fn)(void *),
+ void *(*dup_fn)(const void *),
int (*fn)(void *, void *),
void (*reply_fn)(void *),
void *arg);
More information about the tor-commits
mailing list