/* -*- Mode: C; c-basic-offset: 2; indent-tabs-mode: nil -*- */
/* vim: set filetype=c tabstop=2 shiftwidth=2 expandtab: */

/*
 * queue.d - waiting queue for threads
 *
 * Copyright (c) 2011 Juan Jose Garcia Ripoll
 *
 * See file 'LICENSE' for the copyright details.
 *
 */

#ifdef HAVE_SCHED_H
#include <sched.h>
#endif
#include <signal.h>
#include <ecl/ecl.h>
#include <ecl/internal.h>
#include "threads/ecl_atomics.h"

void ECL_INLINE
ecl_process_yield()
{
#if defined(ECL_WINDOWS_THREADS)
  Sleep(0);
#elif defined(HAVE_SCHED_H)
  sched_yield();
#else
  ecl_musleep(0.0, 1);*/
#endif
    }

void ECL_INLINE
ecl_get_spinlock(cl_env_ptr the_env, cl_object *lock)
{
  cl_object own_process = the_env->own_process;
  while (!AO_compare_and_swap_full((AO_t*)lock, (AO_t)ECL_NIL,
                                   (AO_t)own_process)) {
    ecl_process_yield();
  }
}

void ECL_INLINE
ecl_giveup_spinlock(cl_object *lock)
{
  AO_store((AO_t*)lock, (AO_t)ECL_NIL);
}

static ECL_INLINE void
wait_queue_nconc(cl_env_ptr the_env, cl_object q, cl_object new_tail)
{
  ecl_get_spinlock(the_env, &q->queue.spinlock);
  q->queue.list = ecl_nconc(q->queue.list, new_tail);
  ecl_giveup_spinlock(&q->queue.spinlock);
}

static ECL_INLINE cl_object
wait_queue_pop_all(cl_env_ptr the_env, cl_object q)
{
  cl_object output;
  ecl_disable_interrupts_env(the_env);
  {
    ecl_get_spinlock(the_env, &q->queue.spinlock);
    output = q->queue.list;
    q->queue.list = ECL_NIL;
    ecl_giveup_spinlock(&q->queue.spinlock);
  }
  ecl_enable_interrupts_env(the_env);
  return output;
}

static ECL_INLINE void
wait_queue_delete(cl_env_ptr the_env, cl_object q, cl_object item)
{
  ecl_get_spinlock(the_env, &q->queue.spinlock);
  q->queue.list = ecl_delete_eq(item, q->queue.list);
  ecl_giveup_spinlock(&q->queue.spinlock);
}

/*----------------------------------------------------------------------
 * THREAD SCHEDULER & WAITING
 */

static cl_object
bignum_set_time(cl_object bignum, struct ecl_timeval *time)
{
  _ecl_big_set_index(bignum, time->tv_sec);
  _ecl_big_mul_ui(bignum, bignum, 1000);
  _ecl_big_add_ui(bignum, bignum, (time->tv_usec + 999) / 1000);
  return bignum;
}

static cl_object
elapsed_time(struct ecl_timeval *start)
{
  cl_object delta_big = _ecl_big_register0();
  cl_object aux_big = _ecl_big_register1();
  struct ecl_timeval now;
  ecl_get_internal_real_time(&now);
  bignum_set_time(aux_big, start);
  bignum_set_time(delta_big, &now);
  _ecl_big_sub(delta_big, delta_big, aux_big);
  _ecl_big_register_free(aux_big);
  return delta_big;
}

static double
waiting_time(cl_index iteration, struct ecl_timeval *start)
{
  /* Waiting time is smaller than 0.10 s */
  double time;
  cl_object top = ecl_make_fixnum(10 * 1000);
  cl_object delta_big = elapsed_time(start);
  _ecl_big_div_ui(delta_big, delta_big, iteration);
  if (ecl_number_compare(delta_big, top) < 0) {
    time = ecl_to_double(delta_big) * 1.5;
  } else {
    time = 0.10;
  }
  _ecl_big_register_free(delta_big);
  return time;
}

static cl_object
ecl_wait_on_timed(cl_env_ptr env, cl_object (*condition)(cl_env_ptr, cl_object), cl_object o)
{
  volatile const cl_env_ptr the_env = env;
  volatile cl_object own_process = the_env->own_process;
  volatile cl_object record;
  volatile cl_object output;
  cl_fixnum iteration = 0;
  struct ecl_timeval start;
  ecl_get_internal_real_time(&start);

  /* This spinlock is here because the default path (fair) is
   * too slow */
  for (iteration = 0; iteration < 10; iteration++) {
    cl_object output = condition(the_env,o);
    if (output != ECL_NIL)
      return output;
  }

  /* 0) We reserve a record for the queue. In order to avoid
   * using the garbage collector, we reuse records */
  record = own_process->process.queue_record;
  unlikely_if (record == ECL_NIL) {
    record = ecl_list1(own_process);
  } else {
    own_process->process.queue_record = ECL_NIL;
  }

  ecl_bds_bind(the_env, @'ext::*interrupts-enabled*', ECL_NIL);
  ECL_UNWIND_PROTECT_BEGIN(the_env) {
    /* 2) Now we add ourselves to the queue. In order to
     * avoid a call to the GC, we try to reuse records. */
    print_lock("adding to queue", o);
    own_process->process.woken_up = ECL_NIL;
    wait_queue_nconc(the_env, o, record);
    ecl_bds_bind(the_env, @'ext::*interrupts-enabled*', ECL_T);
    ecl_check_pending_interrupts(the_env);

    /* 3) Unlike the sigsuspend() implementation, this
     * implementation does not block signals and the
     * wakeup event might be lost before the sleep
     * function is invoked. We must thus spin over short
     * intervals of time to ensure that we check the
     * condition periodically. */
    while (Null(output = condition(the_env, o))) {
      ecl_musleep(waiting_time(iteration++, &start), 1);
    }
    ecl_bds_unwind1(the_env);
  } ECL_UNWIND_PROTECT_EXIT {
    /* 4) At this point we wrap up. We remove ourselves
     * from the queue and unblock the lisp interrupt
     * signal. Note that we recover the cons for later use.*/
    wait_queue_delete(the_env, o, own_process);
    own_process->process.queue_record = record;
    ECL_RPLACD(record, ECL_NIL);

    /* 5) When this process exits, it may be because it
     * aborts (which we know because output == ECL_NIL), or
     * because the condition is satisfied. In both cases
     * we allow the first in the queue to test again its
     * condition. This is needed for objects, such as
     * semaphores, where the condition may be satisfied
     * more than once. */
    if (Null(output)) {
      ecl_wakeup_waiters(the_env, o, ECL_WAKEUP_ONE);
    }
  } ECL_UNWIND_PROTECT_END;
  ecl_bds_unwind1(the_env);
  return output;
}

/**********************************************************************
 * BLOCKING WAIT QUEUE ALGORITHM
 *
 * This object keeps a list of processes waiting for a condition to
 * happen. The queue is ordered and the only processes that check for
 * the condition are
 *      - The first process to arrive to the queue,
 *      - Each process which is awoken.
 *      - The first process after the list of awoken processes.
 *
 * The idea is that this will ensure some fairness when unblocking the
 * processes, which is important for abstractions such as mutexes or
 * semaphores, where we want equal sharing of resources among processes.
 *
 * This also implies that the waiting processes depend on others to signal
 * when to check for a condition. This happens in two situations
 *      - External code that changes the fields of the queue object
 *        must signal ecl_wakeup_waiters() (See mutex.d, semaphore.d, etc)
 *      - When a process exits ecl_wait_on() it always resignals the next
 *        process in the queue, because a condition may be satisfied more
 *        than once (for instance when a semaphore is changed, more than
 *        one process may be released)
 *
 * The critical part of this algorithm is the fact that processes
 * communicating the change of conditions may do so before, during or
 * after a process has been registered. Since we do not want those signals
 * to be lost, a proper ordering of steps is required.
 */

cl_object
ecl_wait_on(cl_env_ptr env, cl_object (*condition)(cl_env_ptr, cl_object), cl_object o)
{
#if defined(HAVE_SIGPROCMASK)
  volatile const cl_env_ptr the_env = env;
  volatile cl_object own_process = the_env->own_process;
  volatile cl_object record;
  volatile sigset_t original;
  volatile cl_object output;

  /* 0) We reserve a record for the queue. In order to avoid
   * using the garbage collector, we reuse records */
  record = own_process->process.queue_record;
  unlikely_if (record == ECL_NIL) {
    record = ecl_list1(own_process);
  } else {
    own_process->process.queue_record = ECL_NIL;
  }

  /* 1) First we block lisp interrupt signals. This ensures that
   * any awake signal that is issued from here is not lost. */
  {
    int code = ecl_option_values[ECL_OPT_THREAD_INTERRUPT_SIGNAL];
    sigset_t empty;
    sigemptyset(&empty);
    sigaddset(&empty, code);
    pthread_sigmask(SIG_BLOCK, &empty, &original);
  }

  /* 2) Now we add ourselves to the queue. */
  own_process->process.woken_up = ECL_NIL;
  wait_queue_nconc(the_env, o, record);

  ECL_UNWIND_PROTECT_BEGIN(the_env) {
    /* 3) At this point we may receive signals, but we
     * might have missed a wakeup event if that happened
     * between 0) and 2), which is why we start with the
     * check*/
    while (Null(output = condition(the_env, o)))
      {
        /* This will wait until we get a signal that
         * demands some code being executed. Note that
         * this includes our communication signals and
         * the signals used by the GC. Note also that
         * as a consequence we might throw / return
         * which is why need to protect it all with
         * UNWIND-PROTECT. */
        sigsuspend(&original);
      }
  } ECL_UNWIND_PROTECT_EXIT {
    /* 4) At this point we wrap up. We remove ourselves
     * from the queue and unblock the lisp interrupt
     * signal. Note that we recover the cons for later use.*/
    wait_queue_delete(the_env, o, own_process);
    own_process->process.queue_record = record;
    ECL_RPLACD(record, ECL_NIL);

    /* 5) When this process exits, it may be because it
     * aborts (which we know because output == ECL_NIL), or
     * because the condition is satisfied. In both cases
     * we allow the first in the queue to test again its
     * condition. This is needed for objects, such as
     * semaphores, where the condition may be satisfied
     * more than once. */
    if (Null(output)) {
      ecl_wakeup_waiters(the_env, o, ECL_WAKEUP_ONE);
    }

    /* 6) Restoring signals is done last, to ensure that
     * all cleanup steps are performed. */
    pthread_sigmask(SIG_SETMASK, &original, NULL);
  } ECL_UNWIND_PROTECT_END;
  return output;
#else
  return ecl_wait_on_timed(env, condition, o);
#endif
}

cl_object
ecl_waiter_pop(cl_env_ptr the_env, cl_object q)
{
  cl_object output;
  ecl_disable_interrupts_env(the_env);
  ecl_get_spinlock(the_env, &q->queue.spinlock);
  {
    cl_object l;
    output = ECL_NIL;
    for (l = q->queue.list; l != ECL_NIL; l = ECL_CONS_CDR(l)) {
      cl_object p = ECL_CONS_CAR(l);
      if (p->process.phase != ECL_PROCESS_INACTIVE &&
          p->process.phase != ECL_PROCESS_EXITING) {
        output = p;
        break;
      }
    }
  }
  ecl_giveup_spinlock(&q->queue.spinlock);
  ecl_enable_interrupts_env(the_env);
  return output;
}

void
ecl_wakeup_waiters(cl_env_ptr the_env, cl_object q, int flags)
{
  ecl_disable_interrupts_env(the_env);
  ecl_get_spinlock(the_env, &q->queue.spinlock);
  if (q->queue.list != ECL_NIL) {
    /* We scan the list of waiting processes, awaking one
     * or more, depending on flags. In running through the list
     * we eliminate zombie processes --- they should not be here
     * because of the UNWIND-PROTECT in ecl_wait_on(), but
     * sometimes shit happens */
    cl_object *tail, l;
    for (tail = &q->queue.list; (l = *tail) != ECL_NIL; ) {
      cl_object p = ECL_CONS_CAR(l);
      if (p->process.phase == ECL_PROCESS_INACTIVE ||
          p->process.phase == ECL_PROCESS_EXITING) {
        print_lock("removing %p", q, p);
        *tail = ECL_CONS_CDR(l);
      } else {
        print_lock("awaking %p", q, p);
        /* If the process is active, we then
         * simply awake it with a signal.*/
        p->process.woken_up = ECL_T;
        if (flags & ECL_WAKEUP_DELETE)
          *tail = ECL_CONS_CDR(l);
        tail = &ECL_CONS_CDR(l);
        if (flags & ECL_WAKEUP_KILL)
          mp_process_kill(p);
        else
          ecl_wakeup_process(p);
        if (!(flags & ECL_WAKEUP_ALL))
          break;
      }
    }
  }
  ecl_giveup_spinlock(&q->queue.spinlock);
  ecl_process_yield();
}

#undef print_lock

void
print_lock(char *prefix, cl_object l, ...)
{
  static cl_object lock = ECL_NIL;
  va_list args;
  va_start(args, l);
  if (l == ECL_NIL
      || type_of(l) == t_condition_variable
      || ECL_FIXNUMP(l->lock.name)) {
    cl_env_ptr env = ecl_process_env();
    ecl_get_spinlock(env, &lock);
    printf("\n%ld\t", ecl_fixnum(env->own_process->process.name));
    vprintf(prefix, args);
    if (l != ECL_NIL) {
      cl_object p = l->lock.queue_list;
      while (p != ECL_NIL) {
        printf(" %lx", ecl_fixnum(ECL_CONS_CAR(p)->process.name));
        p = ECL_CONS_CDR(p);
      }
    }
    fflush(stdout);
    ecl_giveup_spinlock(&lock);
  }
}
/*#define print_lock(a,b,c) (void)0*/