Blame rstat/rquantile.c

Packit 67cb25
/* rstat/rquantile.c
Packit 67cb25
 * 
Packit 67cb25
 * Copyright (C) 2015 Patrick Alken
Packit 67cb25
 * 
Packit 67cb25
 * This program is free software; you can redistribute it and/or modify
Packit 67cb25
 * it under the terms of the GNU General Public License as published by
Packit 67cb25
 * the Free Software Foundation; either version 3 of the License, or (at
Packit 67cb25
 * your option) any later version.
Packit 67cb25
 * 
Packit 67cb25
 * This program is distributed in the hope that it will be useful, but
Packit 67cb25
 * WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 67cb25
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 67cb25
 * General Public License for more details.
Packit 67cb25
 * 
Packit 67cb25
 * You should have received a copy of the GNU General Public License
Packit 67cb25
 * along with this program; if not, write to the Free Software
Packit 67cb25
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
Packit 67cb25
 */
Packit 67cb25
Packit 67cb25
#include <config.h>
Packit 67cb25
#include <stdlib.h>
Packit 67cb25
#include <math.h>
Packit 67cb25
#include <gsl/gsl_math.h>
Packit 67cb25
#include <gsl/gsl_sort.h>
Packit 67cb25
#include <gsl/gsl_statistics.h>
Packit 67cb25
#include <gsl/gsl_rstat.h>
Packit 67cb25
Packit 67cb25
/*
Packit 67cb25
 * Running quantile calculation based on the paper
Packit 67cb25
 *
Packit 67cb25
 * [1] R. Jain and I. Chlamtac, "The P^2 algorithm for dynamic
Packit 67cb25
 *     calculation of quantiles and histograms without storing
Packit 67cb25
 *     observations", Communications of the ACM, October 1985
Packit 67cb25
 */
Packit 67cb25
Packit 67cb25
static double calc_psq(const double qp1, const double q, const double qm1,
Packit 67cb25
                       const double d, const double np1, const double n, const double nm1);
Packit 67cb25
Packit 67cb25
gsl_rstat_quantile_workspace *
Packit 67cb25
gsl_rstat_quantile_alloc(const double p)
Packit 67cb25
{
Packit 67cb25
  gsl_rstat_quantile_workspace *w;
Packit 67cb25
Packit 67cb25
  w = calloc(1, sizeof(gsl_rstat_quantile_workspace));
Packit 67cb25
  if (w == 0)
Packit 67cb25
    {
Packit 67cb25
      GSL_ERROR_NULL ("failed to allocate space for workspace", GSL_ENOMEM);
Packit 67cb25
    }
Packit 67cb25
Packit 67cb25
  w->p = p;
Packit 67cb25
Packit 67cb25
  gsl_rstat_quantile_reset(w);
Packit 67cb25
Packit 67cb25
  return w;
Packit 67cb25
} /* gsl_rstat_quantile_alloc() */
Packit 67cb25
Packit 67cb25
void
Packit 67cb25
gsl_rstat_quantile_free(gsl_rstat_quantile_workspace *w)
Packit 67cb25
{
Packit 67cb25
  free(w);
Packit 67cb25
} /* gsl_rstat_quantile_free() */
Packit 67cb25
Packit 67cb25
int
Packit 67cb25
gsl_rstat_quantile_reset(gsl_rstat_quantile_workspace *w)
Packit 67cb25
{
Packit 67cb25
  const double p = w->p;
Packit 67cb25
  size_t i;
Packit 67cb25
Packit 67cb25
  /* initialize positions n */
Packit 67cb25
  for (i = 0; i < 5; ++i)
Packit 67cb25
    w->npos[i] = i + 1;
Packit 67cb25
Packit 67cb25
  /* initialize n' */
Packit 67cb25
  w->np[0] = 1.0;
Packit 67cb25
  w->np[1] = 1.0 + 2.0 * p;
Packit 67cb25
  w->np[2] = 1.0 + 4.0 * p;
Packit 67cb25
  w->np[3] = 3.0 + 2.0 * p;
Packit 67cb25
  w->np[4] = 5.0;
Packit 67cb25
Packit 67cb25
  /* initialize dn' */
Packit 67cb25
  w->dnp[0] = 0.0;
Packit 67cb25
  w->dnp[1] = 0.5 * p;
Packit 67cb25
  w->dnp[2] = p;
Packit 67cb25
  w->dnp[3] = 0.5 * (1.0 + p);
Packit 67cb25
  w->dnp[4] = 1.0;
Packit 67cb25
Packit 67cb25
  w->n = 0;
Packit 67cb25
Packit 67cb25
  return GSL_SUCCESS;
Packit 67cb25
}
Packit 67cb25
Packit 67cb25
int
Packit 67cb25
gsl_rstat_quantile_add(const double x, gsl_rstat_quantile_workspace *w)
Packit 67cb25
{
Packit 67cb25
  if (w->n < 5)
Packit 67cb25
    {
Packit 67cb25
      w->q[w->n] = x;
Packit 67cb25
    }
Packit 67cb25
  else
Packit 67cb25
    {
Packit 67cb25
      int i;
Packit 67cb25
      int k = -1;
Packit 67cb25
Packit 67cb25
      if (w->n == 5)
Packit 67cb25
        {
Packit 67cb25
          /* initialization: sort the first five heights */
Packit 67cb25
          gsl_sort(w->q, 1, w->n);
Packit 67cb25
        }
Packit 67cb25
Packit 67cb25
      /* step B1: find k such that q_k <= x < q_{k+1} */
Packit 67cb25
      if (x < w->q[0])
Packit 67cb25
        {
Packit 67cb25
          w->q[0] = x;
Packit 67cb25
          k = 0;
Packit 67cb25
        }
Packit 67cb25
      else if (x >= w->q[4])
Packit 67cb25
        {
Packit 67cb25
          w->q[4] = x;
Packit 67cb25
          k = 3;
Packit 67cb25
        }
Packit 67cb25
      else
Packit 67cb25
        {
Packit 67cb25
          for (i = 0; i <= 3; ++i)
Packit 67cb25
            {
Packit 67cb25
              if (w->q[i] <= x && x < w->q[i + 1])
Packit 67cb25
                {
Packit 67cb25
                  k = i;
Packit 67cb25
                  break;
Packit 67cb25
                }
Packit 67cb25
            }
Packit 67cb25
        }
Packit 67cb25
Packit 67cb25
      if (k < 0)
Packit 67cb25
        {
Packit 67cb25
          /* we could get here if x is nan */
Packit 67cb25
          GSL_ERROR ("invalid input argument x", GSL_EINVAL);
Packit 67cb25
        }
Packit 67cb25
Packit 67cb25
      /* step B2(a): update n_i */
Packit 67cb25
      for (i = k + 1; i <= 4; ++i)
Packit 67cb25
        ++(w->npos[i]);
Packit 67cb25
Packit 67cb25
      /* step B2(b): update n_i' */
Packit 67cb25
      for (i = 0; i < 5; ++i)
Packit 67cb25
        w->np[i] += w->dnp[i];
Packit 67cb25
Packit 67cb25
      /* step B3: update heights */
Packit 67cb25
      for (i = 1; i <= 3; ++i)
Packit 67cb25
        {
Packit 67cb25
          double ni = (double) w->npos[i];
Packit 67cb25
          double d = w->np[i] - ni;
Packit 67cb25
Packit 67cb25
          if ((d >= 1.0 && (w->npos[i + 1] - w->npos[i] > 1)) ||
Packit 67cb25
              (d <= -1.0 && (w->npos[i - 1] - w->npos[i] < -1)))
Packit 67cb25
            {
Packit 67cb25
              int dsign = (d > 0.0) ? 1 : -1;
Packit 67cb25
              double qp1 = w->q[i + 1];
Packit 67cb25
              double qi = w->q[i];
Packit 67cb25
              double qm1 = w->q[i - 1];
Packit 67cb25
              double np1 = (double) w->npos[i + 1];
Packit 67cb25
              double nm1 = (double) w->npos[i - 1];
Packit 67cb25
              double qp = calc_psq(qp1, qi, qm1, (double) dsign,
Packit 67cb25
                                   np1, ni, nm1);
Packit 67cb25
Packit 67cb25
              if (qm1 < qp && qp < qp1)
Packit 67cb25
                w->q[i] = qp;
Packit 67cb25
              else
Packit 67cb25
                {
Packit 67cb25
                  /* use linear formula */
Packit 67cb25
                  w->q[i] += dsign * (w->q[i + dsign] - qi) / ((double) w->npos[i + dsign] - ni);
Packit 67cb25
                }
Packit 67cb25
Packit 67cb25
              w->npos[i] += dsign;
Packit 67cb25
            }
Packit 67cb25
        }
Packit 67cb25
    }
Packit 67cb25
Packit 67cb25
  ++(w->n);
Packit 67cb25
Packit 67cb25
  return GSL_SUCCESS;
Packit 67cb25
} /* gsl_rstat_quantile_add() */
Packit 67cb25
Packit 67cb25
double
Packit 67cb25
gsl_rstat_quantile_get(gsl_rstat_quantile_workspace *w)
Packit 67cb25
{
Packit 67cb25
  if (w->n >= 5)
Packit 67cb25
    {
Packit 67cb25
      return w->q[2];
Packit 67cb25
    }
Packit 67cb25
  else
Packit 67cb25
    {
Packit 67cb25
      /* not yet initialized */
Packit 67cb25
      gsl_sort(w->q, 1, w->n);
Packit 67cb25
      return gsl_stats_quantile_from_sorted_data(w->q, 1, w->n, w->p);
Packit 67cb25
    }
Packit 67cb25
} /* gsl_rstat_quantile_get() */
Packit 67cb25
Packit 67cb25
static double
Packit 67cb25
calc_psq(const double qp1, const double q, const double qm1,
Packit 67cb25
         const double d, const double np1, const double n, const double nm1)
Packit 67cb25
{
Packit 67cb25
  double outer = d / (np1 - nm1);
Packit 67cb25
  double inner_left = (n - nm1 + d) * (qp1 - q) / (np1 - n);
Packit 67cb25
  double inner_right = (np1 - n - d) * (q - qm1) / (n - nm1);
Packit 67cb25
Packit 67cb25
  return q + outer * (inner_left + inner_right);
Packit 67cb25
} /* calc_psq() */