-remove trailing whitespace
[oweals/gnunet.git] / src / arm / gnunet-service-arm.c
index 9643273cfaafd1ffdaca679921d226f76fc8c4f8..1196b20aa7242716a4bc1910348684d70a92a9c0 100644 (file)
@@ -1,10 +1,10 @@
 /*
      This file is part of GNUnet.
-     (C) 2009 Christian Grothoff (and other contributing authors)
+     (C) 2009, 2010, 2011 Christian Grothoff (and other contributing authors)
 
      GNUnet is free software; you can redistribute it and/or modify
      it under the terms of the GNU General Public License as published
-     by the Free Software Foundation; either version 2, or (at your
+     by the Free Software Foundation; either version 3, or (at your
      option) any later version.
 
      GNUnet is distributed in the hope that it will be useful, but
  * @file arm/gnunet-service-arm.c
  * @brief the automated restart manager service
  * @author Christian Grothoff
- *
- * TODO:
- * - multiple start-stop requests with RC>1 can result
- *   in UP/DOWN signals based on "pending" that are inaccurate...
- *   => have list of clients waiting for a resolution instead of
- *      giving instant (but incorrect) replies
- * - code could go into restart-loop for a service
- *   if service crashes instantly -- need exponential back-off
- * - need to test auto-restart code on configuration changes;
- * - should refine restart code to check if *relevant* parts of the
- *   configuration were changed (anything in the section for the service)
- * - should have a way to specify dependencies between services and
- *   manage restarts of groups of services
  */
 #include "platform.h"
-#include "gnunet_client_lib.h"
-#include "gnunet_getopt_lib.h"
-#include "gnunet_os_lib.h"
+#include "gnunet_util_lib.h"
+#include "gnunet_arm_service.h"
 #include "gnunet_protocols.h"
-#include "gnunet_service_lib.h"
 #include "arm.h"
 
+/**
+ * How many messages do we queue up at most for optional
+ * notifications to a client?  (this can cause notifications
+ * about outgoing messages to be dropped).
+ */
+#define MAX_NOTIFY_QUEUE 1024
 
 /**
- * Run maintenance every second.
+ * List of our services.
  */
-#define MAINT_FREQUENCY GNUNET_TIME_UNIT_SECONDS
+struct ServiceList;
+
 
 /**
- * How long do we wait until we decide that a service
- * did not start?
+ * Record with information about a listen socket we have open.
  */
-#define CHECK_TIMEOUT GNUNET_TIME_UNIT_MINUTES
+struct ServiceListeningInfo
+{
+  /**
+   * This is a linked list.
+   */
+  struct ServiceListeningInfo *next;
 
-struct ServiceList;
+  /**
+   * This is a linked list.
+   */
+  struct ServiceListeningInfo *prev;
+
+  /**
+   * Address this socket is listening on.
+   */
+  struct sockaddr *service_addr;
+
+  /**
+   * Service this listen socket is for.
+   */
+  struct ServiceList *sl;
+
+  /**
+   * Number of bytes in 'service_addr'
+   */
+  socklen_t service_addr_len;
+
+  /**
+   * Our listening socket.
+   */
+  struct GNUNET_NETWORK_Handle *listen_socket;
+
+  /**
+   * Task doing the accepting.
+   */
+  GNUNET_SCHEDULER_TaskIdentifier accept_task;
+
+};
 
-typedef void (*CleanCallback) (void *cls, struct ServiceList * pos);
 
 /**
  * List of our services.
@@ -66,10 +91,25 @@ typedef void (*CleanCallback) (void *cls, struct ServiceList * pos);
 struct ServiceList
 {
   /**
-   * This is a linked list.
+   * This is a doubly-linked list.
    */
   struct ServiceList *next;
 
+  /**
+   * This is a doubly-linked list.
+   */
+  struct ServiceList *prev;
+
+  /**
+   * Linked list of listen sockets associated with this service.
+   */
+  struct ServiceListeningInfo *listen_head;
+
+  /**
+   * Linked list of listen sockets associated with this service.
+   */
+  struct ServiceListeningInfo *listen_tail;
+
   /**
    * Name of the service.
    */
@@ -86,613 +126,1314 @@ struct ServiceList
   char *config;
 
   /**
-   * Function to call upon kill completion (waitpid), NULL
+   * Client to notify upon kill completion (waitpid), NULL
    * if we should simply restart the process.
    */
-  CleanCallback kill_continuation;
+  struct GNUNET_SERVER_Client *killing_client;
+
+  /**
+   * ID of the request that killed the service (for reporting back).
+   */
+  uint64_t killing_client_request_id;
 
   /**
-   * Closure for kill_continuation.
+   * Process structure pointer of the child.
    */
-  void *kill_continuation_cls;
+  struct GNUNET_OS_Process *proc;
 
   /**
-   * Process ID of the child.
+   * Process exponential backoff time
    */
-  pid_t pid;
+  struct GNUNET_TIME_Relative backoff;
 
   /**
-   * Last time the config of this service was
-   * modified.
+   * Absolute time at which the process is scheduled to restart in case of death
    */
-  time_t mtime;
+  struct GNUNET_TIME_Absolute restart_at;
 
   /**
-   * Reference counter (counts how many times we've been
-   * asked to start the service).  We only actually stop
-   * it once rc hits zero.
+   * Time we asked the service to shut down (used to calculate time it took
+   * the service to terminate).
    */
-  unsigned int rc;
+  struct GNUNET_TIME_Absolute killed_at;
 
+  /**
+   * Is this service to be started by default (or did a client tell us explicitly
+   * to start it)?  GNUNET_NO if the service is started only upon 'accept' on a
+   * listen socket or possibly explicitly by a client changing the value.
+   */
+  int is_default;
+
+  /**
+   * Should we use pipes to signal this process? (YES for Java binaries and if we
+   * are on Windoze).
+   */
+  int pipe_control;
 };
 
 /**
  * List of running services.
  */
-static struct ServiceList *running;
+static struct ServiceList *running_head;
 
 /**
- * Our configuration
+ * List of running services.
  */
-static struct GNUNET_CONFIGURATION_Handle *cfg;
+static struct ServiceList *running_tail;
 
 /**
- * Our scheduler.
+ * Our configuration
  */
-static struct GNUNET_SCHEDULER_Handle *sched;
+static const struct GNUNET_CONFIGURATION_Handle *cfg;
 
 /**
  * Command to prepend to each actual command.
  */
 static char *prefix_command;
 
+/**
+ * Option to append to each actual command.
+ */
+static char *final_option;
+
+/**
+ * ID of task called whenever we get a SIGCHILD.
+ */
+static GNUNET_SCHEDULER_TaskIdentifier child_death_task;
+
+/**
+ * ID of task called whenever the timeout for restarting a child
+ * expires.
+ */
+static GNUNET_SCHEDULER_TaskIdentifier child_restart_task;
+
+/**
+ * Pipe used to communicate shutdown via signal.
+ */
+static struct GNUNET_DISK_PipeHandle *sigpipe;
+
+/**
+ * Are we in shutdown mode?
+ */
+static int in_shutdown;
 
+/**
+ * Handle to our server instance.  Our server is a bit special in that
+ * its service is not immediately stopped once we get a shutdown
+ * request (since we need to continue service until all of our child
+ * processes are dead).  This handle is used to shut down the server
+ * (and thus trigger process termination) once all child processes are
+ * also dead.  A special option in the ARM configuration modifies the
+ * behaviour of the service implementation to not do the shutdown
+ * immediately.
+ */
+static struct GNUNET_SERVER_Handle *server;
+
+/**
+ * Context for notifications we need to send to our clients.
+ */
+static struct GNUNET_SERVER_NotificationContext *notifier;
+
+
+#include "do_start_process.c"
+
+/**
+ * Transmit a status result message.
+ *
+ * @param cls a `unit16_t *` with message type
+ * @param size number of bytes available in @a buf
+ * @param buf where to copy the message, NULL on error
+ * @return number of bytes copied to @a buf
+ */
 static size_t
 write_result (void *cls, size_t size, void *buf)
 {
-  uint16_t *res = cls;
-  struct GNUNET_MessageHeader *msg;
+  struct GNUNET_ARM_ResultMessage *msg = cls;
+  size_t msize;
 
   if (buf == NULL)
-    return 0;                   /* error, not much we can do */
-  GNUNET_assert (size >= sizeof (struct GNUNET_MessageHeader));
-  msg = buf;
-  msg->size = htons (sizeof (struct GNUNET_MessageHeader));
-  msg->type = htons (*res);
-  GNUNET_free (res);
-  return sizeof (struct GNUNET_MessageHeader);
+  {
+    GNUNET_log (GNUNET_ERROR_TYPE_WARNING,
+               _("Could not send status result to client\n"));
+    GNUNET_free (msg);
+    return 0;                  /* error, not much we can do */
+  }
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+             "Sending status response %u to client\n",
+             (unsigned int) msg->result);
+  msize = msg->arm_msg.header.size;
+  GNUNET_assert (size >= msize);
+  msg->arm_msg.header.size = htons (msg->arm_msg.header.size);
+  msg->arm_msg.header.type = htons (msg->arm_msg.header.type);
+  msg->result = htonl (msg->result);
+  msg->arm_msg.request_id = GNUNET_htonll (msg->arm_msg.request_id);
+  memcpy (buf, msg, msize);
+  GNUNET_free (msg);
+  return msize;
 }
 
 
-
 /**
- * Signal our client that we will start or stop the
- * service.
+ * Transmit the list of running services.
  *
- * @return NULL if it was not found
+ * @param cls pointer to `struct GNUNET_ARM_ListResultMessage` with the message
+ * @param size number of bytes available in @a buf
+ * @param buf where to copy the message, NULL on error
+ * @return number of bytes copied to @a buf
  */
-static void
-signal_result (struct GNUNET_SERVER_Client *client,
-               const char *name, uint16_t result)
+static size_t
+write_list_result (void *cls, size_t size, void *buf)
 {
-  uint16_t *res;
+  struct GNUNET_ARM_ListResultMessage *msg = cls;
+  size_t rslt_size;
 
-#if DEBUG_ARM
-  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
-              "Telling client that service `%s' is now %s\n",
-              name,
-              result == GNUNET_MESSAGE_TYPE_ARM_IS_DOWN ? "down" : "up");
-#endif
-  res = GNUNET_malloc (sizeof (uint16_t));
-  *res = result;
-  GNUNET_SERVER_notify_transmit_ready (client,
-                                       sizeof (struct GNUNET_MessageHeader),
-                                       GNUNET_TIME_UNIT_FOREVER_REL,
-                                       &write_result, res);
+  if (buf == NULL)
+  {
+    GNUNET_log (GNUNET_ERROR_TYPE_WARNING,
+                _("Could not send list result to client\n"));
+    GNUNET_free (msg);
+    return 0;                   /* error, not much we can do */
+  }
+
+  rslt_size = msg->arm_msg.header.size;
+  GNUNET_assert (size >= rslt_size);
+  msg->arm_msg.header.size = htons (msg->arm_msg.header.size);
+  msg->arm_msg.header.type = htons (msg->arm_msg.header.type);
+  msg->arm_msg.request_id = GNUNET_htonll (msg->arm_msg.request_id);
+  msg->count = htons (msg->count);
+
+  memcpy (buf, msg, rslt_size);
+  GNUNET_free (msg);
+  return rslt_size;
 }
 
 
 /**
- * Find the process with the given service
- * name in the given list, remove it and return it.
+ * Signal our client that we will start or stop the
+ * service.
  *
+ * @param client who is being signalled
+ * @param name name of the service
+ * @param request_id id of the request that is being responded to.
+ * @param result message type to send
  * @return NULL if it was not found
  */
-static struct ServiceList *
-find_name (const char *name)
+static void
+signal_result (struct GNUNET_SERVER_Client *client,
+              const char *name,
+              uint64_t request_id,
+              enum GNUNET_ARM_Result result)
 {
-  struct ServiceList *pos;
-  struct ServiceList *prev;
-
-  pos = running;
-  prev = NULL;
-  while (pos != NULL)
-    {
-      if (0 == strcmp (pos->name, name))
-        {
-          if (prev == NULL)
-            running = pos->next;
-          else
-            prev->next = pos->next;
-          pos->next = NULL;
-          return pos;
-        }
-      prev = pos;
-      pos = pos->next;
-    }
-  return NULL;
+  struct GNUNET_ARM_ResultMessage *msg;
+  size_t msize;
+
+  msize = sizeof (struct GNUNET_ARM_ResultMessage);
+  msg = GNUNET_malloc (msize);
+  msg->arm_msg.header.size = msize;
+  msg->arm_msg.header.type = GNUNET_MESSAGE_TYPE_ARM_RESULT;
+  msg->result = result;
+  msg->arm_msg.request_id = request_id;
+
+  GNUNET_SERVER_notify_transmit_ready (client, msize,
+                                      GNUNET_TIME_UNIT_FOREVER_REL,
+                                      write_result, msg);
 }
 
 
+/**
+ * Tell all clients about status change of a service.
+ *
+ * @param name name of the service
+ * @param status message type to send
+ * @param unicast if not NULL, send to this client only.
+ *                otherwise, send to all clients in the notifier
+ */
 static void
-free_entry (struct ServiceList *pos)
+broadcast_status (const char *name,
+                 enum GNUNET_ARM_ServiceStatus status,
+                 struct GNUNET_SERVER_Client *unicast)
 {
-  GNUNET_free_non_null (pos->config);
-  GNUNET_free_non_null (pos->binary);
-  GNUNET_free (pos->name);
-  GNUNET_free (pos);
-}
-
+  struct GNUNET_ARM_StatusMessage *msg;
+  size_t namelen;
 
+  if (NULL == notifier)
+    return;
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+      "Sending status %u of service `%s' to client\n",
+      (unsigned int) status, name);
+  namelen = strlen (name);
+  msg = GNUNET_malloc (sizeof (struct GNUNET_ARM_StatusMessage) + namelen + 1);
+  msg->header.size = htons (sizeof (struct GNUNET_ARM_StatusMessage) + namelen + 1);
+  msg->header.type = htons (GNUNET_MESSAGE_TYPE_ARM_STATUS);
+  msg->status = htonl ((uint32_t) (status));
+  memcpy ((char *) &msg[1], name, namelen + 1);
+
+  if (NULL == unicast)
+    GNUNET_SERVER_notification_context_broadcast (notifier,
+        (struct GNUNET_MessageHeader *) msg, GNUNET_YES);
+  else
+    GNUNET_SERVER_notification_context_unicast (notifier, unicast,
+        (const struct GNUNET_MessageHeader *) msg, GNUNET_NO);
+  GNUNET_free (msg);
+}
 
 
 /**
  * Actually start the process for the given service.
  *
  * @param sl identifies service to start
+ * @param client that asked to start the service (may be NULL)
+ * @param request_id id of the request in response to which the process is
+ *                   being started. 0 if starting was not requested.
  */
 static void
-start_process (struct ServiceList *sl)
+start_process (struct ServiceList *sl, struct GNUNET_SERVER_Client *client, uint64_t request_id)
 {
   char *loprefix;
   char *options;
-  char **argv;
-  unsigned int argv_size;
-  char *lopos;
   char *optpos;
-  const char *firstarg;
+  char *optend;
+  const char *next;
   int use_debug;
+  char b;
+  char *val;
+  struct ServiceListeningInfo *sli;
+  SOCKTYPE *lsocks;
+  unsigned int ls;
+  char *binary;
 
-  /* start service */
+  /* calculate listen socket list */
+  lsocks = NULL;
+  ls = 0;
+  for (sli = sl->listen_head; NULL != sli; sli = sli->next)
+    {
+      GNUNET_array_append (lsocks, ls,
+                          GNUNET_NETWORK_get_fd (sli->listen_socket));
+      if (sli->accept_task != GNUNET_SCHEDULER_NO_TASK)
+       {
+         GNUNET_SCHEDULER_cancel (sli->accept_task);
+         sli->accept_task = GNUNET_SCHEDULER_NO_TASK;
+       }
+    }
+#if WINDOWS
+  GNUNET_array_append (lsocks, ls, INVALID_SOCKET);
+#else
+  GNUNET_array_append (lsocks, ls, -1);
+#endif
+
+  /* obtain configuration */
   if (GNUNET_OK !=
-      GNUNET_CONFIGURATION_get_value_string (cfg,
-                                             sl->name, "PREFIX", &loprefix))
+      GNUNET_CONFIGURATION_get_value_string (cfg, sl->name, "PREFIX",
+                                            &loprefix))
     loprefix = GNUNET_strdup (prefix_command);
   if (GNUNET_OK !=
-      GNUNET_CONFIGURATION_get_value_string (cfg,
-                                             sl->name, "OPTIONS", &options))
-    options = GNUNET_strdup ("");
-  use_debug = GNUNET_CONFIGURATION_get_value_yesno (cfg, sl->name, "DEBUG");
-
-  GNUNET_log (GNUNET_ERROR_TYPE_INFO, _("Starting service `%s'\n"), sl->name);
-#if DEBUG_ARM
-  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
-              "Starting service `%s' using binary `%s' and configuration `%s'\n",
-              sl->name, sl->binary, sl->config);
-#endif
-  argv_size = 6;
-  if (use_debug)
-    argv_size += 2;
-  lopos = loprefix;
-  while ('\0' != *lopos)
-    {
-      if (*lopos == ' ')
-        argv_size++;
-      lopos++;
-    }
-  optpos = options;
-  while ('\0' != *optpos)
+      GNUNET_CONFIGURATION_get_value_string (cfg, sl->name, "OPTIONS",
+                                            &options))
     {
-      if (*optpos == ' ')
-        argv_size++;
-      optpos++;
+      options = GNUNET_strdup (final_option);
+      if (NULL == strstr (options, "%"))
+       {
+         /* replace '{}' with service name */
+         while (NULL != (optpos = strstr (options, "{}")))
+           {
+             optpos[0] = '%';
+             optpos[1] = 's';
+             GNUNET_asprintf (&optpos, options, sl->name);
+             GNUNET_free (options);
+             options = optpos;
+           }
+         /* replace '$PATH' with value associated with "PATH" */
+         while (NULL != (optpos = strstr (options, "$")))
+           {
+             optend = optpos + 1;
+             while (isupper ((unsigned char) *optend))
+               optend++;
+             b = *optend;
+             if ('\0' == b)
+               next = "";
+             else
+               next = optend + 1;
+             *optend = '\0';
+             if (GNUNET_OK !=
+                 GNUNET_CONFIGURATION_get_value_string (cfg, "PATHS",
+                                                        optpos + 1, &val))
+               val = GNUNET_strdup ("");
+             *optpos = '\0';
+             GNUNET_asprintf (&optpos, "%s%s%c%s", options, val, b, next);
+             GNUNET_free (options);
+             GNUNET_free (val);
+             options = optpos;
+           }
+       }
     }
-  firstarg = NULL;
-  argv = GNUNET_malloc (argv_size * sizeof (char *));
-  argv_size = 0;
-  lopos = loprefix;
+  use_debug = GNUNET_CONFIGURATION_get_value_yesno (cfg, sl->name, "DEBUG");
 
-  while ('\0' != *lopos)
-    {
-      while (*lopos == ' ')
-        lopos++;
-      if (*lopos == '\0')
-        continue;
-      if (argv_size == 0)
-        firstarg = lopos;
-      argv[argv_size++] = lopos;
-      while (('\0' != *lopos) && (' ' != *lopos))
-        lopos++;
-      if ('\0' == *lopos)
-        continue;
-      *lopos = '\0';
-      lopos++;
-    }
-  if (argv_size == 0)
-    firstarg = sl->binary;
-  argv[argv_size++] = sl->binary;
-  argv[argv_size++] = "-c";
-  argv[argv_size++] = sl->config;
+  /* actually start process */
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+             "Starting service `%s' using binary `%s' and configuration `%s'\n",
+             sl->name, sl->binary, sl->config);
+  binary = GNUNET_OS_get_libexec_binary_path (sl->binary);
+  GNUNET_assert (NULL == sl->proc);
   if (GNUNET_YES == use_debug)
-    {
-      argv[argv_size++] = "-L";
-      argv[argv_size++] = "DEBUG";
-    }
-  optpos = options;
-  while ('\0' != *optpos)
-    {
-      while (*optpos == ' ')
-        optpos++;
-      if (*optpos == '\0')
-        continue;
-      argv[argv_size++] = optpos;
-      while (('\0' != *optpos) && (' ' != *optpos))
-        optpos++;
-      if ('\0' == *optpos)
-        continue;
-      *optpos = '\0';
-      optpos++;
-    }
-  argv[argv_size++] = NULL;
-  sl->pid = GNUNET_OS_start_process_v (firstarg, argv);
-  GNUNET_free (argv);
+  {
+    if (NULL == sl->config)
+      sl->proc =
+       do_start_process (sl->pipe_control, GNUNET_OS_INHERIT_STD_OUT_AND_ERR,
+                         lsocks, loprefix, binary, "-L",
+                         "DEBUG", options, NULL);
+    else
+      sl->proc =
+       do_start_process (sl->pipe_control, GNUNET_OS_INHERIT_STD_OUT_AND_ERR,
+                         lsocks, loprefix, binary, "-c", sl->config, "-L",
+                         "DEBUG", options, NULL);
+  }
+  else
+  {
+    if (NULL == sl->config)
+      sl->proc =
+       do_start_process (sl->pipe_control, GNUNET_OS_INHERIT_STD_OUT_AND_ERR,
+                         lsocks, loprefix, binary,
+                         options, NULL);
+    else
+      sl->proc =
+       do_start_process (sl->pipe_control, GNUNET_OS_INHERIT_STD_OUT_AND_ERR,
+                         lsocks, loprefix, binary, "-c", sl->config,
+                         options, NULL);
+  }
+  GNUNET_free (binary);
+  if (sl->proc == NULL)
+  {
+    GNUNET_log (GNUNET_ERROR_TYPE_ERROR, _("Failed to start service `%s'\n"),
+               sl->name);
+    if (client)
+      signal_result (client, sl->name, request_id, GNUNET_ARM_RESULT_START_FAILED);
+  }
+  else
+  {
+    GNUNET_log (GNUNET_ERROR_TYPE_INFO, _("Starting service `%s'\n"),
+               sl->name);
+    broadcast_status (sl->name, GNUNET_ARM_SERVICE_STARTING, NULL);
+    if (client)
+      signal_result (client, sl->name, request_id, GNUNET_ARM_RESULT_STARTING);
+  }
+  /* clean up */
   GNUNET_free (loprefix);
   GNUNET_free (options);
+  GNUNET_array_grow (lsocks, ls, 0);
 }
 
 
 /**
- * Start the specified service.
+ * Find the process with the given service
+ * name in the given list and return it.
+ *
+ * @param name which service entry to look up
+ * @return NULL if it was not found
  */
-static void
-start_service (struct GNUNET_SERVER_Client *client, const char *servicename)
+static struct ServiceList *
+find_service (const char *name)
 {
   struct ServiceList *sl;
-  char *binary;
-  char *config;
-  struct stat sbuf;
-  sl = find_name (servicename);
-  if (sl != NULL)
+
+  sl = running_head;
+  while (sl != NULL)
     {
-      /* already running, just increment RC */
-      GNUNET_log (GNUNET_ERROR_TYPE_INFO,
-                  _("Service `%s' already running.\n"), servicename);
-      sl->rc++;
-      sl->next = running;
-      running = sl;
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_UP);
+      if (0 == strcasecmp (sl->name, name))
+       return sl;
+      sl = sl->next;
+    }
+  return NULL;
+}
+
+
+/**
+ * First connection has come to the listening socket associated with the service,
+ * create the service in order to relay the incoming connection to it
+ *
+ * @param cls callback data, `struct ServiceListeningInfo` describing a listen socket
+ * @param tc context
+ */
+static void
+accept_connection (void *cls, const struct GNUNET_SCHEDULER_TaskContext *tc)
+{
+  struct ServiceListeningInfo *sli = cls;
+  struct ServiceList *sl = sli->sl;
+
+  sli->accept_task = GNUNET_SCHEDULER_NO_TASK;
+  GNUNET_assert (GNUNET_NO == in_shutdown);
+  if (0 != (GNUNET_SCHEDULER_REASON_SHUTDOWN & tc->reason))
+    return;
+  start_process (sl, NULL, 0);
+}
+
+
+/**
+ * Creating a listening socket for each of the service's addresses and
+ * wait for the first incoming connection to it
+ *
+ * @param sa address associated with the service
+ * @param addr_len length of @a sa
+ * @param sl service entry for the service in question
+ */
+static void
+create_listen_socket (struct sockaddr *sa, socklen_t addr_len,
+                     struct ServiceList *sl)
+{
+  static int on = 1;
+  struct GNUNET_NETWORK_Handle *sock;
+  struct ServiceListeningInfo *sli;
+
+  switch (sa->sa_family)
+    {
+    case AF_INET:
+      sock = GNUNET_NETWORK_socket_create (PF_INET, SOCK_STREAM, 0);
+      break;
+    case AF_INET6:
+      sock = GNUNET_NETWORK_socket_create (PF_INET6, SOCK_STREAM, 0);
+      break;
+    case AF_UNIX:
+      if (strcmp (GNUNET_a2s (sa, addr_len), "@") == 0)        /* Do not bind to blank UNIX path! */
+       return;
+      sock = GNUNET_NETWORK_socket_create (PF_UNIX, SOCK_STREAM, 0);
+      break;
+    default:
+      GNUNET_break (0);
+      sock = NULL;
+      errno = EAFNOSUPPORT;
+      break;
+    }
+  if (NULL == sock)
+    {
+      GNUNET_log (GNUNET_ERROR_TYPE_ERROR,
+                 _("Unable to create socket for service `%s': %s\n"),
+                 sl->name, STRERROR (errno));
+      GNUNET_free (sa);
       return;
     }
-  if (GNUNET_OK !=
-      GNUNET_CONFIGURATION_get_value_string (cfg,
-                                             servicename, "BINARY", &binary))
+  if (GNUNET_NETWORK_socket_setsockopt
+      (sock, SOL_SOCKET, SO_REUSEADDR, &on, sizeof (on)) != GNUNET_OK)
+    GNUNET_log_strerror (GNUNET_ERROR_TYPE_ERROR | GNUNET_ERROR_TYPE_BULK,
+                        "setsockopt");
+#ifdef IPV6_V6ONLY
+  if ((sa->sa_family == AF_INET6) &&
+      (GNUNET_NETWORK_socket_setsockopt
+       (sock, IPPROTO_IPV6, IPV6_V6ONLY, &on, sizeof (on)) != GNUNET_OK))
+    GNUNET_log_strerror (GNUNET_ERROR_TYPE_ERROR | GNUNET_ERROR_TYPE_BULK,
+                        "setsockopt");
+#endif
+
+  if (GNUNET_NETWORK_socket_bind
+      (sock, (const struct sockaddr *) sa, addr_len, 0) != GNUNET_OK)
     {
       GNUNET_log (GNUNET_ERROR_TYPE_WARNING,
-                  _("Binary implementing service `%s' not known!\n"),
-                  servicename);
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_DOWN);
+                 _
+                 ("Unable to bind listening socket for service `%s' to address `%s': %s\n"),
+                 sl->name, GNUNET_a2s (sa, addr_len), STRERROR (errno));
+      GNUNET_break (GNUNET_OK == GNUNET_NETWORK_socket_close (sock));
+      GNUNET_free (sa);
       return;
     }
-  if ((GNUNET_OK !=
-       GNUNET_CONFIGURATION_get_value_filename (cfg,
-                                                servicename,
-                                                "CONFIG",
-                                                &config)) ||
-      (0 != STAT (config, &sbuf)))
+  if (GNUNET_NETWORK_socket_listen (sock, 5) != GNUNET_OK)
     {
-      GNUNET_log (GNUNET_ERROR_TYPE_WARNING,
-                  _("Configuration file `%s' for service `%s' not known!\n"),
-                  config, servicename);
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_DOWN);
-      GNUNET_free (binary);
-      GNUNET_free (config);
+      GNUNET_log_strerror (GNUNET_ERROR_TYPE_ERROR, "listen");
+      GNUNET_break (GNUNET_OK == GNUNET_NETWORK_socket_close (sock));
+      GNUNET_free (sa);
       return;
     }
-  sl = GNUNET_malloc (sizeof (struct ServiceList));
-  sl->name = GNUNET_strdup (servicename);
-  sl->next = running;
-  sl->rc = 1;
-  sl->binary = binary;
-  sl->config = config;
-  sl->mtime = sbuf.st_mtime;
-  running = sl;
-  start_process (sl);
-  signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_UP);
+  GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+             _("ARM now monitors connections to service `%s' at `%s'\n"),
+             sl->name, GNUNET_a2s (sa, addr_len));
+  sli = GNUNET_malloc (sizeof (struct ServiceListeningInfo));
+  sli->service_addr = sa;
+  sli->service_addr_len = addr_len;
+  sli->listen_socket = sock;
+  sli->sl = sl;
+  sli->accept_task =
+    GNUNET_SCHEDULER_add_read_net (GNUNET_TIME_UNIT_FOREVER_REL, sock,
+                                  &accept_connection, sli);
+  GNUNET_CONTAINER_DLL_insert (sl->listen_head, sl->listen_tail, sli);
 }
 
 
+/**
+ * Remove and free an entry in the service list.  Listen sockets
+ * must have already been cleaned up.  Only to be called during shutdown.
+ *
+ * @param sl entry to free
+ */
 static void
-free_and_signal (void *cls, struct ServiceList *pos)
+free_service (struct ServiceList *sl)
 {
-  struct GNUNET_SERVER_Client *client = cls;
-  /* find_name will remove "pos" from the list! */
-  GNUNET_assert (pos == find_name (pos->name));
-  GNUNET_log (GNUNET_ERROR_TYPE_INFO, "Service `%s' stopped\n", pos->name);
-  signal_result (client, pos->name, GNUNET_MESSAGE_TYPE_ARM_IS_DOWN);
-  GNUNET_SERVER_receive_done (client, GNUNET_OK);
-  GNUNET_SERVER_client_drop (client);
-  free_entry (pos);
+  GNUNET_assert (GNUNET_YES == in_shutdown);
+  GNUNET_CONTAINER_DLL_remove (running_head, running_tail, sl);
+  GNUNET_assert (NULL == sl->listen_head);
+  GNUNET_free_non_null (sl->config);
+  GNUNET_free_non_null (sl->binary);
+  GNUNET_free (sl->name);
+  GNUNET_free (sl);
 }
 
 
 /**
- * Stop the specified service.
+ * Handle START-message.
+ *
+ * @param cls closure (always NULL)
+ * @param client identification of the client
+ * @param message the actual message
+ * @return #GNUNET_OK to keep the connection open,
+ *         #GNUNET_SYSERR to close it (signal serious error)
  */
 static void
-stop_service (struct GNUNET_SERVER_Client *client, const char *servicename)
+handle_start (void *cls, struct GNUNET_SERVER_Client *client,
+             const struct GNUNET_MessageHeader *message)
 {
-  struct ServiceList *pos;
-  struct GNUNET_CLIENT_Connection *sc;
-
-  GNUNET_log (GNUNET_ERROR_TYPE_INFO,
-              "Preparing to stop `%s'\n", servicename);
-  pos = find_name (servicename);
-  if ((pos != NULL) && (pos->kill_continuation != NULL))
+  const char *servicename;
+  struct ServiceList *sl;
+  uint16_t size;
+  uint64_t request_id;
+  struct GNUNET_ARM_Message *amsg;
+
+  amsg = (struct GNUNET_ARM_Message *) message;
+  request_id = GNUNET_ntohll (amsg->request_id);
+  size = ntohs (amsg->header.size);
+  size -= sizeof (struct GNUNET_ARM_Message);
+  servicename = (const char *) &amsg[1];
+  if ((size == 0) || (servicename[size - 1] != '\0'))
     {
-      /* killing already in progress */
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_DOWN);
+      GNUNET_break (0);
+      GNUNET_SERVER_receive_done (client, GNUNET_SYSERR);
       return;
     }
-  if ((pos != NULL) && (pos->rc > 1))
+  if (GNUNET_YES == in_shutdown)
     {
-      /* RC>1, just decrement RC */
-      pos->rc--;
-      pos->next = running;
-      running = pos;
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_UP);
+      signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_IN_SHUTDOWN);
       GNUNET_SERVER_receive_done (client, GNUNET_OK);
       return;
     }
-  if (pos != NULL)
+  sl = find_service (servicename);
+  if (NULL == sl)
     {
-      if (0 != PLIBC_KILL (pos->pid, SIGTERM))
-        GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "kill");
-      pos->next = running;
-      running = pos;
-      pos->kill_continuation = &free_and_signal;
-      pos->kill_continuation_cls = client;
-      GNUNET_SERVER_client_keep (client);
+      signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_IS_NOT_KNOWN);
+      GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
     }
-  else
+  sl->is_default = GNUNET_YES;
+  if (sl->proc != NULL)
     {
-      sc = GNUNET_CLIENT_connect (sched, servicename, cfg);
-      GNUNET_CLIENT_service_shutdown (sc);
-      GNUNET_CLIENT_disconnect (sc);
-      signal_result (client, servicename, GNUNET_MESSAGE_TYPE_ARM_IS_DOWN);
+      signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_IS_STARTED_ALREADY);
       GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
     }
+  start_process (sl, client, request_id);
+  GNUNET_SERVER_receive_done (client, GNUNET_OK);
 }
 
 
 /**
- * Handle START-message.
+ * Start a shutdown sequence.
+ *
+ * @param cls closure (refers to service)
+ * @param tc task context
+ */
+static void
+trigger_shutdown (void *cls, const struct GNUNET_SCHEDULER_TaskContext *tc)
+{
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG, "Triggering shutdown\n");
+  GNUNET_SCHEDULER_shutdown ();
+}
+
+
+/**
+ * Handle STOP-message.
  *
  * @param cls closure (always NULL)
  * @param client identification of the client
  * @param message the actual message
- * @return GNUNET_OK to keep the connection open,
- *         GNUNET_SYSERR to close it (signal serious error)
+ * @return #GNUNET_OK to keep the connection open,
+ *         #GNUNET_SYSERR to close it (signal serious error)
  */
 static void
-handle_start (void *cls,
-              struct GNUNET_SERVER_Client *client,
-              const struct GNUNET_MessageHeader *message)
+handle_stop (void *cls, struct GNUNET_SERVER_Client *client,
+            const struct GNUNET_MessageHeader *message)
 {
+  struct ServiceList *sl;
   const char *servicename;
   uint16_t size;
-
-  size = ntohs (message->size);
-  size -= sizeof (struct GNUNET_MessageHeader);
-  servicename = (const char *) &message[1];
+  uint64_t request_id;
+  struct GNUNET_ARM_Message *amsg;
+
+  amsg = (struct GNUNET_ARM_Message *) message;
+  request_id = GNUNET_ntohll (amsg->request_id);
+  size = ntohs (amsg->header.size);
+  size -= sizeof (struct GNUNET_ARM_Message);
+  servicename = (const char *) &amsg[1];
   if ((size == 0) || (servicename[size - 1] != '\0'))
     {
       GNUNET_break (0);
       GNUNET_SERVER_receive_done (client, GNUNET_SYSERR);
       return;
     }
-  start_service (client, servicename);
+  GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+             _("Preparing to stop `%s'\n"), servicename);
+  if (0 == strcasecmp (servicename, "arm"))
+  {
+    broadcast_status (servicename, GNUNET_ARM_SERVICE_STOPPING, NULL);
+    signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_STOPPING);
+    GNUNET_SERVER_client_persist_ (client);
+    GNUNET_SCHEDULER_add_now (trigger_shutdown, NULL);
+    GNUNET_SERVER_receive_done (client, GNUNET_OK);
+    return;
+  }
+  sl = find_service (servicename);
+  if (sl == NULL)
+    {
+      signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_IS_NOT_KNOWN);
+      GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
+    }
+  sl->is_default = GNUNET_NO;
+  if (GNUNET_YES == in_shutdown)
+    {
+      /* shutdown in progress */
+      signal_result (client, servicename, request_id, GNUNET_ARM_RESULT_IN_SHUTDOWN);
+      GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
+    }
+  if (sl->killing_client != NULL)
+    {
+      /* killing already in progress */
+      signal_result (client, servicename, request_id,
+          GNUNET_ARM_RESULT_IS_STOPPING_ALREADY);
+      GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
+    }
+  if (sl->proc == NULL)
+    {
+      /* process is down */
+      signal_result (client, servicename, request_id,
+          GNUNET_ARM_RESULT_IS_STOPPED_ALREADY);
+      GNUNET_SERVER_receive_done (client, GNUNET_OK);
+      return;
+    }
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+             "Sending kill signal to service `%s', waiting for process to die.\n",
+             servicename);
+  broadcast_status (servicename, GNUNET_ARM_SERVICE_STOPPING, NULL);
+  /* no signal_start - only when it's STOPPED */
+  sl->killed_at = GNUNET_TIME_absolute_get ();
+  if (0 != GNUNET_OS_process_kill (sl->proc, SIGTERM))
+    GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "kill");
+  sl->killing_client = client;
+  sl->killing_client_request_id = request_id;
+  GNUNET_SERVER_client_keep (client);
   GNUNET_SERVER_receive_done (client, GNUNET_OK);
 }
 
 
 /**
- * Handle STOP-message.
+ * Handle LIST-message.
  *
  * @param cls closure (always NULL)
  * @param client identification of the client
  * @param message the actual message
- * @return GNUNET_OK to keep the connection open,
- *         GNUNET_SYSERR to close it (signal serious error)
  */
 static void
-handle_stop (void *cls,
-             struct GNUNET_SERVER_Client *client,
+handle_list (void *cls, struct GNUNET_SERVER_Client *client,
              const struct GNUNET_MessageHeader *message)
 {
-  const char *servicename;
-  uint16_t size;
+  struct GNUNET_ARM_ListResultMessage *msg;
+  struct GNUNET_ARM_Message *request;
+  size_t string_list_size;
+  size_t total_size;
+  struct ServiceList *sl;
+  uint16_t count;
+
+  if (NULL == client)
+    return;
+
+  request = (struct GNUNET_ARM_Message *) message;
+  count = 0;
+  string_list_size = 0;
+  /* first count the running processes get their name's size */
+  for (sl = running_head; sl != NULL; sl = sl->next)
+  {
+    if (sl->proc != NULL)
+    {
+      string_list_size += strlen (sl->name);
+      string_list_size += strlen (sl->binary);
+      string_list_size += 4;
+      count++;
+    }
+  }
+
+  total_size = sizeof (struct GNUNET_ARM_ListResultMessage)
+               + string_list_size;
+  msg = GNUNET_malloc (total_size);
+  msg->arm_msg.header.size = total_size;
+  msg->arm_msg.header.type = GNUNET_MESSAGE_TYPE_ARM_LIST_RESULT;
+  msg->arm_msg.request_id = GNUNET_ntohll (request->request_id);
+  msg->count = count;
+
+  char *pos = (char *)&msg[1];
+  for (sl = running_head; sl != NULL; sl = sl->next)
+  {
+    if (sl->proc != NULL)
+    {
+      size_t s = strlen (sl->name) + strlen (sl->binary) + 4;
+      GNUNET_snprintf(pos, s, "%s (%s)", sl->name, sl->binary);
+      pos += s;
+    }
+  }
 
-  size = ntohs (message->size);
-  size -= sizeof (struct GNUNET_MessageHeader);
-  servicename = (const char *) &message[1];
-  if ((size == 0) || (servicename[size - 1] != '\0'))
+  GNUNET_SERVER_notify_transmit_ready (client,
+                                       total_size,
+                                       GNUNET_TIME_UNIT_FOREVER_REL,
+                                       write_list_result, msg);
+  GNUNET_SERVER_receive_done (client, GNUNET_OK);
+}
+
+
+/**
+ * We are done with everything.  Stop remaining
+ * tasks, signal handler and the server.
+ */
+static void
+do_shutdown ()
+{
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG, "Last shutdown phase\n");
+  if (NULL != notifier)
+  {
+    GNUNET_SERVER_notification_context_destroy (notifier);
+    notifier = NULL;
+  }
+  if (NULL != server)
     {
-      GNUNET_break (0);
-      GNUNET_SERVER_receive_done (client, GNUNET_SYSERR);
-      return;
+      GNUNET_SERVER_destroy (server);
+      server = NULL;
+    }
+  if (GNUNET_SCHEDULER_NO_TASK != child_death_task)
+    {
+      GNUNET_SCHEDULER_cancel (child_death_task);
+      child_death_task = GNUNET_SCHEDULER_NO_TASK;
     }
-  stop_service (client, servicename);
 }
 
 
+static unsigned int
+list_count (struct ServiceList *running_head)
+{
+  struct ServiceList *i;
+  unsigned int res = 0;
+
+  for (res = 0, i = running_head; i; i = i->next, res++)
+    GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+               "%s\n",
+               i->name);
+  return res;
+}
+
 
 /**
- * Background task doing maintenance.
+ * Task run for shutdown.
  *
- * @param cls closure
+ * @param cls closure, NULL if we need to self-restart
  * @param tc context
  */
 static void
-maint (void *cls, const struct GNUNET_SCHEDULER_TaskContext *tc)
+shutdown_task (void *cls, const struct GNUNET_SCHEDULER_TaskContext *tc)
 {
   struct ServiceList *pos;
-  const char *statstr;
-  int statcode;
-  struct stat sbuf;
+  struct ServiceList *nxt;
+  struct ServiceListeningInfo *sli;
+
+  GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+             "First shutdown phase\n");
+  if (GNUNET_SCHEDULER_NO_TASK != child_restart_task)
+  {
+    GNUNET_SCHEDULER_cancel (child_restart_task);
+    child_restart_task = GNUNET_SCHEDULER_NO_TASK;
+  }
+  in_shutdown = GNUNET_YES;
+  /* first, stop listening */
+  for (pos = running_head; NULL != pos; pos = pos->next)
+  {
+    while (NULL != (sli = pos->listen_head))
+      {
+       GNUNET_CONTAINER_DLL_remove (pos->listen_head,
+                                    pos->listen_tail, sli);
+       if (sli->accept_task != GNUNET_SCHEDULER_NO_TASK)
+         {
+           GNUNET_SCHEDULER_cancel (sli->accept_task);
+           sli->accept_task = GNUNET_SCHEDULER_NO_TASK;
+         }
+       GNUNET_break (GNUNET_OK ==
+                     GNUNET_NETWORK_socket_close (sli->listen_socket));
+       GNUNET_free (sli->service_addr);
+       GNUNET_free (sli);
+      }
+  }
+  /* then, shutdown all existing service processes */
+  nxt = running_head;
+  while (NULL != (pos = nxt))
+  {
+    nxt = pos->next;
+    if (pos->proc != NULL)
+    {
+      GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+                 "Stopping service `%s'\n",
+                 pos->name);
+      pos->killed_at = GNUNET_TIME_absolute_get ();
+      if (0 != GNUNET_OS_process_kill (pos->proc, SIGTERM))
+       GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "kill");
+    }
+    else
+    {
+      free_service (pos);
+    }
+  }
+  /* finally, should all service processes be already gone, terminate for real */
+  if (running_head == NULL)
+    do_shutdown ();
+  else
+    GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+               "Delaying shutdown, have %u childs still running\n",
+               list_count (running_head));
+}
+
 
+/**
+ * Task run whenever it is time to restart a child that died.
+ *
+ * @param cls closure, always NULL
+ * @param tc context
+ */
+static void
+delayed_restart_task (void *cls,
+                     const struct GNUNET_SCHEDULER_TaskContext *tc)
+{
+  struct ServiceList *sl;
+  struct GNUNET_TIME_Relative lowestRestartDelay;
+  struct ServiceListeningInfo *sli;
+
+  child_restart_task = GNUNET_SCHEDULER_NO_TASK;
   if (0 != (tc->reason & GNUNET_SCHEDULER_REASON_SHUTDOWN))
+    return;
+  GNUNET_assert (GNUNET_NO == in_shutdown);
+  lowestRestartDelay = GNUNET_TIME_UNIT_FOREVER_REL;
+
+  /* check for services that need to be restarted due to
+   * configuration changes or because the last restart failed */
+  for (sl = running_head; NULL != sl; sl = sl->next)
+  {
+    if (NULL != sl->proc)
+      continue;
+    /* service is currently not running */
+    if (0 == GNUNET_TIME_absolute_get_remaining (sl->restart_at).rel_value_us)
     {
-      GNUNET_log (GNUNET_ERROR_TYPE_INFO, _("Stopping all services\n"));
-      while (NULL != (pos = running))
-        {
-          running = pos->next;
-          if (0 != PLIBC_KILL (pos->pid, SIGTERM))
-            GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "kill");
-          if (GNUNET_OK != GNUNET_OS_process_wait(pos->pid))
-            GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "waitpid");
-          free_entry (pos);
-        }
+      /* restart is now allowed */
+      if (sl->is_default)
+      {
+       /* process should run by default, start immediately */
+       GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+                   _("Restarting service `%s'.\n"), sl->name);
+       start_process (sl, NULL, 0);
+      }
+      else
+      {
+       /* process is run on-demand, ensure it is re-started if there is demand */
+       for (sli = sl->listen_head; NULL != sli; sli = sli->next)
+         if (GNUNET_SCHEDULER_NO_TASK == sli->accept_task)
+         {
+           /* accept was actually paused, so start it again */
+           sli->accept_task =
+             GNUNET_SCHEDULER_add_read_net
+             (GNUNET_TIME_UNIT_FOREVER_REL, sli->listen_socket,
+              &accept_connection, sli);
+         }
+      }
+    }
+    else
+    {
+      /* update calculation for earliest time to reactivate a service */
+      lowestRestartDelay =
+       GNUNET_TIME_relative_min (lowestRestartDelay,
+                                 GNUNET_TIME_absolute_get_remaining
+                                 (sl->restart_at));
+    }
+  }
+  if (lowestRestartDelay.rel_value_us != GNUNET_TIME_UNIT_FOREVER_REL.rel_value_us)
+  {
+    GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+               "Will restart process in %s\n",
+               GNUNET_STRINGS_relative_time_to_string (lowestRestartDelay, GNUNET_YES));
+    child_restart_task =
+      GNUNET_SCHEDULER_add_delayed_with_priority (lowestRestartDelay,
+                                                 GNUNET_SCHEDULER_PRIORITY_IDLE,
+                                                 &delayed_restart_task, NULL);
+  }
+}
+
+
+/**
+ * Task triggered whenever we receive a SIGCHLD (child
+ * process died).
+ *
+ * @param cls closure, NULL if we need to self-restart
+ * @param tc context
+ */
+static void
+maint_child_death (void *cls, const struct GNUNET_SCHEDULER_TaskContext *tc)
+{
+  struct ServiceList *pos;
+  struct ServiceList *next;
+  struct ServiceListeningInfo *sli;
+  const char *statstr;
+  int statcode;
+  int ret;
+  char c[16];
+  enum GNUNET_OS_ProcessStatusType statusType;
+  unsigned long statusCode;
+  const struct GNUNET_DISK_FileHandle *pr;
+
+  pr = GNUNET_DISK_pipe_handle (sigpipe, GNUNET_DISK_PIPE_END_READ);
+  child_death_task = GNUNET_SCHEDULER_NO_TASK;
+  if (0 == (tc->reason & GNUNET_SCHEDULER_REASON_READ_READY))
+    {
+      /* shutdown scheduled us, ignore! */
+      child_death_task =
+       GNUNET_SCHEDULER_add_read_file (GNUNET_TIME_UNIT_FOREVER_REL,
+                                       pr, &maint_child_death, NULL);
       return;
     }
-  GNUNET_SCHEDULER_add_delayed (tc->sched,
-                                GNUNET_YES,
-                                GNUNET_SCHEDULER_PRIORITY_IDLE,
-                                GNUNET_SCHEDULER_NO_PREREQUISITE_TASK,
-                                MAINT_FREQUENCY, &maint, cfg);
+  /* consume the signal */
+  GNUNET_break (0 < GNUNET_DISK_file_read (pr, &c, sizeof (c)));
 
   /* check for services that died (WAITPID) */
-  for (pos = running; pos != NULL; pos = pos->next)
+  next = running_head;
+  while (NULL != (pos = next))
     {
-      enum GNUNET_OS_ProcessStatusType statusType;
-      unsigned long statusCode;
+      next = pos->next;
 
-      if (GNUNET_OS_process_status(pos->pid, &statusType, &statusCode) != GNUNET_OK)
+      if (pos->proc == NULL)
       {
-        GNUNET_log_strerror(GNUNET_ERROR_TYPE_ERROR, "GNUNET_OS_process_status");
-        continue;
+       if (GNUNET_YES == in_shutdown)
+         free_service (pos);
+       continue;
+      }
+      if ((GNUNET_SYSERR ==
+          (ret =
+           GNUNET_OS_process_status (pos->proc, &statusType, &statusCode)))
+         || ((ret == GNUNET_NO) || (statusType == GNUNET_OS_PROCESS_STOPPED)
+             || (statusType == GNUNET_OS_PROCESS_RUNNING)))
+       continue;
+      if (statusType == GNUNET_OS_PROCESS_EXITED)
+      {
+       statstr = _( /* process termination method */ "exit");
+       statcode = statusCode;
       }
-
-      if (statusType == GNUNET_OS_PROCESS_STOPPED || statusType == GNUNET_OS_PROCESS_RUNNING)
-        continue;
-      else if (statusType == GNUNET_OS_PROCESS_EXITED)
-        {
-          statstr = _( /* process termination method */ "exit");
-          statcode = statusCode;
-        }
       else if (statusType == GNUNET_OS_PROCESS_SIGNALED)
-        {
-          statstr = _( /* process termination method */ "signal");
-          statcode = statusCode;
-        }
+      {
+       statstr = _( /* process termination method */ "signal");
+       statcode = statusCode;
+      }
       else
+      {
+       statstr = _( /* process termination method */ "unknown");
+       statcode = 0;
+      }
+      if (0 != pos->killed_at.abs_value_us)
+      {
+       GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+                   _("Service `%s' took %s to terminate\n"),
+                   pos->name,
+                   GNUNET_STRINGS_relative_time_to_string (GNUNET_TIME_absolute_get_duration (pos->killed_at), GNUNET_YES));
+      }
+      GNUNET_OS_process_destroy (pos->proc);
+      pos->proc = NULL;
+      broadcast_status (pos->name, GNUNET_ARM_SERVICE_STOPPED, NULL);
+      if (NULL != pos->killing_client)
+      {
+        signal_result (pos->killing_client, pos->name,
+            pos->killing_client_request_id, GNUNET_ARM_RESULT_STOPPED);
+        GNUNET_SERVER_client_drop (pos->killing_client);
+        pos->killing_client = NULL;
+        pos->killing_client_request_id = 0;
+      }
+      if (GNUNET_YES != in_shutdown)
+      {
+        if ((statusType == GNUNET_OS_PROCESS_EXITED) && (statcode == 0))
         {
-          statstr = _( /* process termination method */ "unknown");
-          statcode = 0;
-        }
-      if (NULL != pos->kill_continuation)
+          /* process terminated normally, allow restart at any time */
+          pos->restart_at.abs_value_us = 0;
+          GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+              _("Service `%s' terminated normally, will restart at any time\n"),
+              pos->name);
+          /* process can still be re-started on-demand, ensure it is re-started if there is demand */
+          for (sli = pos->listen_head; NULL != sli; sli = sli->next)
+          {
+            GNUNET_break (GNUNET_SCHEDULER_NO_TASK == sli->accept_task);
+            sli->accept_task =
+                GNUNET_SCHEDULER_add_read_net (GNUNET_TIME_UNIT_FOREVER_REL,
+                    sli->listen_socket, &accept_connection, sli);
+          }
+       }
+        else
         {
-          pos->kill_continuation (pos->kill_continuation_cls, pos);
+         if (0 == (tc->reason & GNUNET_SCHEDULER_REASON_SHUTDOWN))
+           GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+               _("Service `%s' terminated with status %s/%d, will restart in %s\n"),
+                pos->name, statstr, statcode,
+                GNUNET_STRINGS_relative_time_to_string (pos->backoff, GNUNET_YES));
+         /* schedule restart */
+         pos->restart_at = GNUNET_TIME_relative_to_absolute (pos->backoff);
+         pos->backoff = GNUNET_TIME_STD_BACKOFF (pos->backoff);
+          if (GNUNET_SCHEDULER_NO_TASK != child_restart_task)
+            GNUNET_SCHEDULER_cancel (child_restart_task);
+          child_restart_task = GNUNET_SCHEDULER_add_with_priority (
+            GNUNET_SCHEDULER_PRIORITY_IDLE, &delayed_restart_task, NULL);
         }
+      }
       else
-        {
-          GNUNET_log (GNUNET_ERROR_TYPE_WARNING,
-                      _
-                      ("Service `%s' terminated with status %s/%d, will try to restart it!\n"),
-                      pos->name, statstr, statcode);
-          /* schedule restart */
-          pos->pid = 0;
-        }
+      {
+        free_service (pos);
+      }
     }
+  child_death_task = GNUNET_SCHEDULER_add_read_file (
+      GNUNET_TIME_UNIT_FOREVER_REL, pr, &maint_child_death, NULL);
+  if ((NULL == running_head) && (GNUNET_YES == in_shutdown))
+    do_shutdown ();
+  else if (GNUNET_YES == in_shutdown)
+    GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
+        "Delaying shutdown after child's death, still have %u children\n",
+        list_count (running_head));
 
-  /* check for services that need to be restarted due to
-     configuration changes or because the last restart failed */
-  pos = running;
-  while (pos != NULL)
+}
+
+
+/**
+ * Signal handler called for SIGCHLD.  Triggers the
+ * respective handler by writing to the trigger pipe.
+ */
+static void
+sighandler_child_death ()
+{
+  static char c;
+  int old_errno = errno;       /* back-up errno */
+
+  GNUNET_break (1 ==
+               GNUNET_DISK_file_write (GNUNET_DISK_pipe_handle
+                                       (sigpipe, GNUNET_DISK_PIPE_END_WRITE),
+                                       &c, sizeof (c)));
+  errno = old_errno;           /* restore errno */
+}
+
+
+/**
+ * Setup our service record for the given section in the configuration file
+ * (assuming the section is for a service).
+ *
+ * @param cls unused
+ * @param section a section in the configuration file
+ * @return #GNUNET_OK (continue)
+ */
+static void
+setup_service (void *cls, const char *section)
+{
+  struct ServiceList *sl;
+  char *binary;
+  char *config;
+  struct stat sbuf;
+  struct sockaddr **addrs;
+  socklen_t *addr_lens;
+  int ret;
+  unsigned int i;
+
+  if (strcasecmp (section, "arm") == 0)
+    return;
+  if (GNUNET_OK !=
+      GNUNET_CONFIGURATION_get_value_string (cfg, section, "BINARY", &binary))
     {
-      if ((0 == STAT (pos->config, &sbuf)) && (pos->mtime < sbuf.st_mtime))
-        {
-          GNUNET_log (GNUNET_ERROR_TYPE_INFO,
-                      _
-                      ("Restarting service `%s' due to configuration file change.\n"));
-          if (0 != PLIBC_KILL (pos->pid, SIGTERM))
-            GNUNET_log_strerror (GNUNET_ERROR_TYPE_WARNING, "kill");
-        }
-      if (pos->pid == 0)
-        {
-          GNUNET_log (GNUNET_ERROR_TYPE_INFO,
-                      _("Restarting service `%s'.\n"), pos->name);
-          /* FIXME: should have some exponentially
-             increasing timer to avoid tight restart loops */
-          start_process (pos);
-        }
-      pos = pos->next;
+      /* not a service section */
+      return;
+    }
+  sl = find_service (section);
+  if (NULL != sl)
+  {
+    /* got the same section twice!? */
+    GNUNET_break (0);
+    GNUNET_free (binary);
+    return;
+  }
+  config = NULL;
+  if (( (GNUNET_OK !=
+        GNUNET_CONFIGURATION_get_value_filename (cfg, section, "CONFIG",
+                                                 &config)) &&
+       (GNUNET_OK !=
+        GNUNET_CONFIGURATION_get_value_filename (cfg, "PATHS", "DEFAULTCONFIG",
+                                                 &config)) ) ||
+      (0 != STAT (config, &sbuf)))
+  {
+    if (NULL != config)
+    {
+      GNUNET_log_config_invalid (GNUNET_ERROR_TYPE_WARNING,
+                                section, "CONFIG",
+                                STRERROR (errno));
+      GNUNET_free (config);
+      config = NULL;
     }
+  }
+  sl = GNUNET_new (struct ServiceList);
+  sl->name = GNUNET_strdup (section);
+  sl->binary = binary;
+  sl->config = config;
+  sl->backoff = GNUNET_TIME_UNIT_MILLISECONDS;
+  sl->restart_at = GNUNET_TIME_UNIT_FOREVER_ABS;
+#if WINDOWS
+  sl->pipe_control = GNUNET_YES;
+#else
+  if (GNUNET_CONFIGURATION_have_value (cfg, section, "PIPECONTROL"))
+    sl->pipe_control = GNUNET_CONFIGURATION_get_value_yesno (cfg, section, "PIPECONTROL");
+#endif
+  GNUNET_CONTAINER_DLL_insert (running_head, running_tail, sl);
+  if (GNUNET_YES !=
+      GNUNET_CONFIGURATION_get_value_yesno (cfg, section, "AUTOSTART"))
+    return;
+  if (0 >= (ret = GNUNET_SERVICE_get_server_addresses (section, cfg,
+                                                      &addrs, &addr_lens)))
+    return;
+  /* this will free (or capture) addrs[i] */
+  for (i = 0; i < ret; i++)
+    create_listen_socket (addrs[i], addr_lens[i], sl);
+  GNUNET_free (addrs);
+  GNUNET_free (addr_lens);
 }
 
 
 /**
- * List of handlers for the messages understood by this
- * service.
+ * A client connected, add it to the notification context.
+ *
+ * @param cls closure
+ * @param client identification of the client
  */
-static struct GNUNET_SERVER_MessageHandler handlers[] = {
-  {&handle_start, NULL, GNUNET_MESSAGE_TYPE_ARM_START, 0},
-  {&handle_stop, NULL, GNUNET_MESSAGE_TYPE_ARM_STOP, 0},
-  {NULL, NULL, 0, 0}
-};
+static void
+handle_client_connecting (void *cls, struct GNUNET_SERVER_Client *client)
+{
+  /* All clients are considered to be of the "monitor" kind
+   * (that is, they don't affect ARM shutdown).
+   */
+  if (NULL != client)
+    GNUNET_SERVER_client_mark_monitor (client);
+}
+
+
+/**
+ * Handle MONITOR-message.
+ *
+ * @param cls closure (always NULL)
+ * @param client identification of the client
+ * @param message the actual message
+ * @return #GNUNET_OK to keep the connection open,
+ *         #GNUNET_SYSERR to close it (signal serious error)
+ */
+static void
+handle_monitor (void *cls, struct GNUNET_SERVER_Client *client,
+            const struct GNUNET_MessageHeader *message)
+{
+  /* Removal is handled by the server implementation, internally. */
+  if ((NULL != client) && (NULL != notifier))
+  {
+    GNUNET_SERVER_notification_context_add (notifier, client);
+    broadcast_status ("arm", GNUNET_ARM_SERVICE_MONITORING_STARTED, client);
+    GNUNET_SERVER_receive_done (client, GNUNET_OK);
+  }
+}
 
 
 /**
  * Process arm requests.
  *
  * @param cls closure
- * @param s scheduler to use
- * @param server the initialized server
+ * @param serv the initialized server
  * @param c configuration to use
  */
 static void
-run (void *cls,
-     struct GNUNET_SCHEDULER_Handle *s,
-     struct GNUNET_SERVER_Handle *server,
-     struct GNUNET_CONFIGURATION_Handle *c)
+run (void *cls, struct GNUNET_SERVER_Handle *serv,
+     const struct GNUNET_CONFIGURATION_Handle *c)
 {
+  static const struct GNUNET_SERVER_MessageHandler handlers[] = {
+    {&handle_start, NULL, GNUNET_MESSAGE_TYPE_ARM_START, 0},
+    {&handle_stop, NULL, GNUNET_MESSAGE_TYPE_ARM_STOP, 0},
+    {&handle_monitor, NULL, GNUNET_MESSAGE_TYPE_ARM_MONITOR,
+     sizeof (struct GNUNET_MessageHeader)},
+    {&handle_list, NULL, GNUNET_MESSAGE_TYPE_ARM_LIST,
+     sizeof (struct GNUNET_ARM_Message)},
+    {NULL, NULL, 0, 0}
+  };
   char *defaultservices;
-  char *pos;
+  const char *pos;
+  struct ServiceList *sl;
 
-  GNUNET_log (GNUNET_ERROR_TYPE_INFO, "Starting...\n");
   cfg = c;
-  sched = s;
+  server = serv;
+  GNUNET_assert (serv != NULL);
+  GNUNET_SCHEDULER_add_delayed (GNUNET_TIME_UNIT_FOREVER_REL, &shutdown_task,
+                               NULL);
+  child_death_task =
+    GNUNET_SCHEDULER_add_read_file (GNUNET_TIME_UNIT_FOREVER_REL,
+                                   GNUNET_DISK_pipe_handle (sigpipe,
+                                                            GNUNET_DISK_PIPE_END_READ),
+                                   &maint_child_death, NULL);
+
   if (GNUNET_OK !=
-      GNUNET_CONFIGURATION_get_value_string (cfg,
-                                             "ARM",
-                                             "GLOBAL_PREFIX",
-                                             &prefix_command))
+      GNUNET_CONFIGURATION_get_value_string (cfg, "ARM", "GLOBAL_PREFIX",
+                                            &prefix_command))
     prefix_command = GNUNET_strdup ("");
+  if (GNUNET_OK !=
+      GNUNET_CONFIGURATION_get_value_string (cfg, "ARM", "GLOBAL_POSTFIX",
+                                            &final_option))
+    final_option = GNUNET_strdup ("");
+
+  GNUNET_CONFIGURATION_iterate_sections (cfg, &setup_service, NULL);
+
   /* start default services... */
   if (GNUNET_OK ==
-      GNUNET_CONFIGURATION_get_value_string (cfg,
-                                             "ARM",
-                                             "DEFAULTSERVICES",
-                                             &defaultservices))
+      GNUNET_CONFIGURATION_get_value_string (cfg, "ARM", "DEFAULTSERVICES",
+                                            &defaultservices))
     {
-#if DEBUG_ARM
-      GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
-                  "Starting default services `%s'\n", defaultservices);
-#endif
-      pos = strtok (defaultservices, " ");
-      while (pos != NULL)
-        {
-          start_service (NULL, pos);
-          pos = strtok (NULL, " ");
-        }
+      GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+                 _("Starting default services `%s'\n"), defaultservices);
+      if (0 < strlen (defaultservices))
+       {
+         for (pos = strtok (defaultservices, " "); NULL != pos;
+              pos = strtok (NULL, " "))
+           {
+             sl = find_service (pos);
+             if (NULL == sl)
+               {
+                 GNUNET_log (GNUNET_ERROR_TYPE_ERROR,
+                             _
+                             ("Default service `%s' not configured correctly!\n"),
+                             pos);
+                 continue;
+               }
+             sl->is_default = GNUNET_YES;
+             start_process (sl, NULL, 0);
+           }
+       }
       GNUNET_free (defaultservices);
     }
   else
     {
-#if DEBUG_ARM
-      GNUNET_log (GNUNET_ERROR_TYPE_DEBUG,
-                  "No default services configured.\n");
-#endif
+      GNUNET_log (GNUNET_ERROR_TYPE_INFO,
+                 _
+                 ("No default services configured, GNUnet will not really start right now.\n"));
     }
 
+  notifier =
+      GNUNET_SERVER_notification_context_create (server, MAX_NOTIFY_QUEUE);
+  GNUNET_SERVER_connect_notify (server, handle_client_connecting, NULL);
   /* process client requests */
   GNUNET_SERVER_add_handlers (server, handlers);
-
-  /* manage services */
-  GNUNET_SCHEDULER_add_delayed (sched,
-                                GNUNET_YES,
-                                GNUNET_SCHEDULER_PRIORITY_IDLE,
-                                GNUNET_SCHEDULER_NO_PREREQUISITE_TASK,
-                                MAINT_FREQUENCY, &maint, NULL);
 }
 
 
@@ -706,9 +1447,38 @@ run (void *cls,
 int
 main (int argc, char *const *argv)
 {
-  return (GNUNET_OK ==
-          GNUNET_SERVICE_run (argc,
-                              argv, "arm", &run, NULL, NULL, NULL)) ? 0 : 1;
+  int ret;
+  struct GNUNET_SIGNAL_Context *shc_chld;
+
+  sigpipe = GNUNET_DISK_pipe (GNUNET_NO, GNUNET_NO, GNUNET_NO, GNUNET_NO);
+  GNUNET_assert (sigpipe != NULL);
+  shc_chld =
+    GNUNET_SIGNAL_handler_install (GNUNET_SIGCHLD, &sighandler_child_death);
+  ret =
+    (GNUNET_OK ==
+     GNUNET_SERVICE_run (argc, argv, "arm",
+                        GNUNET_SERVICE_OPTION_MANUAL_SHUTDOWN, &run, NULL)) ? 0 : 1;
+  GNUNET_SIGNAL_handler_uninstall (shc_chld);
+  shc_chld = NULL;
+  GNUNET_DISK_pipe_close (sigpipe);
+  sigpipe = NULL;
+  return ret;
+}
+
+
+#ifdef LINUX
+#include <malloc.h>
+
+/**
+ * MINIMIZE heap size (way below 128k) since this process doesn't need much.
+ */
+void __attribute__ ((constructor)) GNUNET_ARM_memory_init ()
+{
+  mallopt (M_TRIM_THRESHOLD, 4 * 1024);
+  mallopt (M_TOP_PAD, 1 * 1024);
+  malloc_trim (0);
 }
+#endif
+
 
 /* end of gnunet-service-arm.c */