ariadne
/
shttpd


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223
							/* shttpd - make sure each task can make some progress
   Copyright (C) 2018 Ariadne Devos

   This program is free software: you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation, either version 3 of the License, or
   (at your option) any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program.  If not, see <http://www.gnu.org/licenses/>. */

#ifndef _sHT_SCHEDULING_H
#define _sHT_SCHEDULING_H

#include <sHT/compiler.h>
#include <sHT/nospec.h>
/* For sHT_TASK_SCHEDULED */
#include <sHT/task.h>

/* A list of tasks to do.

   This allows for a very simple round-robin scheduler: put new tasks at the
   back, take tasks from the front.

   In sHT, it is convention to name individuals of type sHT_task_deque 'deck'.
   (The former is the type, the latter is an object of that type.)

   Playing with a deque of cards is more convoluted than playing with a *deck*
   of cards!

   (One may argue that this is not really a deque, as one cannot take objects
   from the front. Rather, these operations are possible, but just not defined.)

   TODO:
   Because there are multiple task types, a wrapper can be generated with
   sHT_task_deque_for_type. */
struct sHT_task_deque
{
        /* TODO: it is said that integer division is expensive. Apparently,
           on x86-64, computing the remainder involves division. Perhaps let
           it be a power of 2. */
        unsigned int capacity;
        unsigned int head;
        unsigned int n;
        struct sHT_task *tasks[];
};

__attribute__((pure))
static inline _Bool
sHT_deque_empty_p(const struct sHT_task_deque *deck)
{
        return sHT_unlikely(deck->n == 0);
}

__attribute__((pure))
static inline _Bool
sHT_deque_full_p(const struct sHT_task_deque *deck)
{
        return sHT_unlikely(deck->n == deck->capacity);
}

/* Insert a task at the end if the flag sHT_TASK_SCHEDULED is not set.
   If that bit is set, do nothing.
   This requires a non-full deque, so check first if this operation
   is possible with sHT_deque_full_p, or some other way. */
__attribute__((nonnull (1, 2)))
void
sHT_queue_task(struct sHT_task_deque *deck, struct sHT_task *task);

/** Convenience typedef for @var{sHT_perform_all} */
typedef void (sHT_task_perform)(void *cookie, struct sHT_task *);

/** Perform all tasks that have been queued in @var{deck}.

  @var{deck} must be non-free and concurrent scheduling and descheduling is
  forbidden.

  Let all tasks belonging to @var{deck}, even invalid, unscheduled and removed
  tasks, be U, which may contain duplicates. Let all scheduled tasks in
  @var{deck} be S. (S is a subset of U, and both are multisets.)
  Compose P, a -- possibly infinite -- list of tasks, such that every element
  of P is in U (but not necessarily having the same multiplicity) and on a
  non-speculative execution, there is a bijection between P and S.

  (Informally speaking, P are all tasks of that will actually be executed.
  Ignoring Spectre, it corresponds to all tasks that have been scheduled.
  However, as the Spectre is real, it is possible that, temporarily, tasks will
  be executed multiple times and old tasks are 'recycled'.)

  Apply @var{f} to each element of P (the first argument is @var{cookie}).
  @var{f} is limited in operations to @var{deck}. It may be abandoned.
  Let abandonement be:
  - a cancellation within this function call, unhandled by @var{f}
  - a decision of @var{f} to abandon @var{deck}
  - a non-local return by @var{f}, skipping this function call

  Abandonement implies @var{deck} may be freed or have its capacity read.
  Non-abandonement implies @var{deck} may have its capacity read and that
  tasks may be scheduled. */
__attribute__((nonnull (2, 3)))
__attribute__((always_inline))
static inline void
sHT_perform_all(void *cookie, struct sHT_task_deque *deck, sHT_task_perform *f)
{
	/* 'perform' may reschedule a task, so remember the number of
	   iterations. */
	size_t n_todo = deck->n;
	for (size_t i = 0; sHT_test_hidden(i, i < n_todo); i++) {
		size_t j = deck->head + i;
		/* Make sure it points to a task belonging to @var{deck},
		   to take control of Spectre's branch. */
		j = sHT_modulo_nospec(j, deck->capacity);
		struct sHT_task *task = deck->tasks[j];
		task->flags &= ~sHT_TASK_SCHEDULED;
		f(cookie, task);
	}
	deck->head = sHT_modulo_nospec(deck->head + n_todo, deck->capacity);
	deck->n -= n_todo;
}

/** An non-negative identifier representing a set of kernel resources to watch
  for IO readyness. On *BSD, this is a kqueue(2), on Linux, this is an epoll(7)
  instance. */
typedef int sHT_watch_set;

enum sHT_watch_set_alloc_error
{
	/** The per-process limit on watch sets would have been exceeded. */
	sHT_WATCH_SET_ALLOC_EMFILE = -1,
	/** The system-wide limit on watch sets would have been exceeded. */
	sHT_WATCH_SET_ALLOC_ENFILE = -2,
	/** Memory limits would have been exceeded. */
	sHT_WATCH_SET_ALLOC_ENOMEM = -3,
};

/** Try to allocate a watch set.

  There may be speculative file descriptor leaks. This function may be
  performed concurrently. If a call to this function is interrupted by
  POSIX asynchronuous cancellation, some file descriptors may be leaked.

  If the return value is despeculated and it is non-negative, it is the
  identifier of the watch set as a @var{sHT_event_polling}.
  If the return value is despeculated and it is negative, it is a negative
  @var{sHT_event_polling_alloc_error} error code. */
int
sHT_alloc_watch_set(void);

/** Free the watch set @var{watches}.

  @var{watches}: the possibly non-empty watch set to free.

  @var{watches} may not be accessed concurrently. If a call to this function
  is interrupted by POSIX asynchronuous cancellation, @var{watches} may be
  leaked.

  There may be speculative file descriptor leaks.

  For the avoidance of doubt: @var{watches} must be valid. As such, it must
  have been despeculated at some point in time. Double-freeing is not allowed.

  This cannot fail in any way. */
void
sHT_free_watch_set(sHT_watch_set watches);

enum sHT_watch_set_install
{
	/** The file descriptor has been put into the watch set. */
	sHT_WATCH_SET_INSTALL_DONE = 0,
	/** The watch could not be allocated due to memory limits. */
	sHT_WATCH_SET_INSTALL_ENOMEM = 1,
	/** A maximum on the number of watches would have been exceeded
	  if the watch were allocated */
	sHT_WATCH_SET_INSTALL_LIMIT = 2,
};

/** Try to asynchronuously wait for any readyness change on a file descriptor.

  @var{watches}: the watch set to put @var{fd} in.
  @var{fd}: the pollable file descriptor to register (e.g. a watch set or
  socket). Linux does not allow polling on regular files.
  @var{task}: the task to continue later, after a change in readyness.

  @var{watches} may not be accessed concurrenty and may be modified.
  If a call to this function is cancelled, freeing becomes the only operation
  allowed upon @var{watches}.

  @var{fd} may not already be in @var{polling} and creating loops is not
  allowed.

  The return value may speculatively be incorrect. There may be speculative
  memory leaks.

  If the return value is despeculated, it is a valid
  @var{sHT_watch_set_install} indicating the result. */
__attribute__((warn_unused_result))
__attribute__((nonnull (3)))
enum sHT_watch_set_install
sHT_install_edge_trigger(sHT_watch_set watches, int fd, struct sHT_task *task);

/** Stop asynchronuous waiting for a readyness change on a file descriptor.

  @var{watches}: the watch set to remove @var{fd} from.
  @var{fd}: the file descriptor to remove

  @var{watches} may not be accessed concurrently and may be modified.
  If a call to this function is cancelled, freeing becomes the only operation
  allowed upon @var{watches}.

  @var{fd} must be in @var{polling}.

  There may be speculative memory leaks and the removal may speculatively be
  ignored. This cannot fail in any way. */
void
sHT_delete_edge_trigger(sHT_watch_set watches, int fd);

#endif