From 38d105dede5f423217462c94e71768f2811a39ce Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?P=C5=99emysl=20Janouch?=
Date: Sat, 16 Jan 2016 06:00:41 +0100
Subject: [PATCH] Don't crash when new threads can't be created
---
liberty.c | 64 ++++++++++++++++++++++++++++++++++++++++++++++++++-----
1 file changed, 59 insertions(+), 5 deletions(-)
diff --git a/liberty.c b/liberty.c
index e004464..fd9ccc7 100644
--- a/liberty.c
+++ b/liberty.c
@@ -1073,6 +1073,7 @@ struct async
// "cancelled" may not be accesed or modified by the worker thread
pthread_t worker; ///< Worker thread ID
+ bool started; ///< Worker thread ID is valid
bool cancelled; ///< Task has been cancelled
async_fn execute; ///< Worker main function
@@ -1087,6 +1088,8 @@ async_init (struct async *self, struct async_manager *manager)
self->manager = manager;
}
+static bool async_run (struct async *self);
+
// - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
struct async_manager
@@ -1095,6 +1098,12 @@ struct async_manager
struct async *running; ///< Queue of running jobs
struct async *finished; ///< Queue of completed/cancelled jobs
+ // It's upon the user to call async_manager_dispatch() to retry the delayed.
+ // It's somewhat questionable if this feature is of any use. Possibly if we
+ // provide a means of actively limiting the amount of running async jobs.
+
+ struct async *delayed; ///< Resource exhaustion queue
+
// We need the pipe in order to abort polling (instead of using EINTR)
pthread_cond_t finished_cond; ///< Signals that a task has finished
@@ -1114,6 +1123,18 @@ async_manager_init (struct async_manager *self)
set_cloexec (self->finished_pipe[1]);
}
+static bool
+async_manager_retry (struct async_manager *self, struct async *async)
+{
+ if (async->cancelled)
+ {
+ if (async->destroy)
+ async->destroy (async);
+ return true;
+ }
+ return async_run (async);
+}
+
static struct async *
async_manager_dispatch_fetch (struct async_manager *self)
{
@@ -1145,6 +1166,13 @@ async_manager_dispatch (struct async_manager *self)
if (iter->destroy)
iter->destroy (iter);
}
+
+ LIST_FOR_EACH (struct async, iter, self->delayed)
+ {
+ LIST_UNLINK (self->delayed, iter);
+ if (!async_manager_retry (self, iter))
+ break;
+ }
}
static void
@@ -1164,6 +1192,8 @@ async_manager_cancel_all (struct async_manager *self)
// Mark everything cancelled so that it's not actually dispatched
LIST_FOR_EACH (struct async, iter, self->finished)
iter->cancelled = true;
+ LIST_FOR_EACH (struct async, iter, self->delayed)
+ iter->cancelled = true;
hard_assert (!pthread_mutex_unlock (&self->lock));
async_manager_dispatch (self);
@@ -1187,7 +1217,8 @@ async_manager_free (struct async_manager *self)
static void
async_cancel (struct async *self)
{
- soft_assert (!pthread_cancel (self->worker));
+ if (self->started)
+ soft_assert (!pthread_cancel (self->worker));
self->cancelled = true;
}
@@ -1219,7 +1250,7 @@ async_routine (void *user_data)
return NULL;
}
-static void
+static bool
async_run (struct async *self)
{
hard_assert (!pthread_mutex_lock (&self->manager->lock));
@@ -1231,11 +1262,24 @@ async_run (struct async *self)
hard_assert (!sigfillset (&all_blocked));
hard_assert (!pthread_sigmask (SIG_SETMASK, &all_blocked, &old_blocked));
- hard_assert (!pthread_create (&self->worker, NULL,
- async_routine, self));
+ int error = pthread_create (&self->worker, NULL, async_routine, self);
// Now that we've created the thread, resume signal processing as usual
hard_assert (!pthread_sigmask (SIG_SETMASK, &old_blocked, NULL));
+
+ if (error)
+ {
+ hard_assert (error == EAGAIN);
+
+ hard_assert (!pthread_mutex_lock (&self->manager->lock));
+ LIST_UNLINK (self->manager->running, self);
+ hard_assert (!pthread_mutex_unlock (&self->manager->lock));
+
+ // FIXME: we probably want to have some kind of a limit on the queue
+ LIST_PREPEND (self->manager->delayed, self);
+ return false;
+ }
+ return (self->started = true);
}
#endif // LIBERTY_WANT_ASYNC
@@ -2138,7 +2182,17 @@ poller_common_free (struct poller_common *self)
static int
poller_common_get_timeout (struct poller_common *self)
{
- return self->idle ? 0 : poller_timers_get_poll_timeout (&self->timers);
+ if (self->idle)
+ return 0;
+
+ int timeout = poller_timers_get_poll_timeout (&self->timers);
+#ifdef LIBERTY_WANT_ASYNC
+ // This is completely arbitrary, in general we have no idea when to retry,
+ // however one second doesn't sound like a particularly bad number
+ if (self->async.delayed)
+ timeout = MIN (timeout, 1000);
+#endif // LIBERTY_WANT_ASYNC
+ return timeout;
}
static void