|
Packit |
67cb25 |
/* rstat/rquantile.c
|
|
Packit |
67cb25 |
*
|
|
Packit |
67cb25 |
* Copyright (C) 2015 Patrick Alken
|
|
Packit |
67cb25 |
*
|
|
Packit |
67cb25 |
* This program is free software; you can redistribute it and/or modify
|
|
Packit |
67cb25 |
* it under the terms of the GNU General Public License as published by
|
|
Packit |
67cb25 |
* the Free Software Foundation; either version 3 of the License, or (at
|
|
Packit |
67cb25 |
* your option) any later version.
|
|
Packit |
67cb25 |
*
|
|
Packit |
67cb25 |
* This program is distributed in the hope that it will be useful, but
|
|
Packit |
67cb25 |
* WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
Packit |
67cb25 |
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
Packit |
67cb25 |
* General Public License for more details.
|
|
Packit |
67cb25 |
*
|
|
Packit |
67cb25 |
* You should have received a copy of the GNU General Public License
|
|
Packit |
67cb25 |
* along with this program; if not, write to the Free Software
|
|
Packit |
67cb25 |
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
|
|
Packit |
67cb25 |
*/
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
#include <config.h>
|
|
Packit |
67cb25 |
#include <stdlib.h>
|
|
Packit |
67cb25 |
#include <math.h>
|
|
Packit |
67cb25 |
#include <gsl/gsl_math.h>
|
|
Packit |
67cb25 |
#include <gsl/gsl_sort.h>
|
|
Packit |
67cb25 |
#include <gsl/gsl_statistics.h>
|
|
Packit |
67cb25 |
#include <gsl/gsl_rstat.h>
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/*
|
|
Packit |
67cb25 |
* Running quantile calculation based on the paper
|
|
Packit |
67cb25 |
*
|
|
Packit |
67cb25 |
* [1] R. Jain and I. Chlamtac, "The P^2 algorithm for dynamic
|
|
Packit |
67cb25 |
* calculation of quantiles and histograms without storing
|
|
Packit |
67cb25 |
* observations", Communications of the ACM, October 1985
|
|
Packit |
67cb25 |
*/
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
static double calc_psq(const double qp1, const double q, const double qm1,
|
|
Packit |
67cb25 |
const double d, const double np1, const double n, const double nm1);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
gsl_rstat_quantile_workspace *
|
|
Packit |
67cb25 |
gsl_rstat_quantile_alloc(const double p)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
gsl_rstat_quantile_workspace *w;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
w = calloc(1, sizeof(gsl_rstat_quantile_workspace));
|
|
Packit |
67cb25 |
if (w == 0)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
GSL_ERROR_NULL ("failed to allocate space for workspace", GSL_ENOMEM);
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
w->p = p;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
gsl_rstat_quantile_reset(w);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
return w;
|
|
Packit |
67cb25 |
} /* gsl_rstat_quantile_alloc() */
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
void
|
|
Packit |
67cb25 |
gsl_rstat_quantile_free(gsl_rstat_quantile_workspace *w)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
free(w);
|
|
Packit |
67cb25 |
} /* gsl_rstat_quantile_free() */
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
int
|
|
Packit |
67cb25 |
gsl_rstat_quantile_reset(gsl_rstat_quantile_workspace *w)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
const double p = w->p;
|
|
Packit |
67cb25 |
size_t i;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* initialize positions n */
|
|
Packit |
67cb25 |
for (i = 0; i < 5; ++i)
|
|
Packit |
67cb25 |
w->npos[i] = i + 1;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* initialize n' */
|
|
Packit |
67cb25 |
w->np[0] = 1.0;
|
|
Packit |
67cb25 |
w->np[1] = 1.0 + 2.0 * p;
|
|
Packit |
67cb25 |
w->np[2] = 1.0 + 4.0 * p;
|
|
Packit |
67cb25 |
w->np[3] = 3.0 + 2.0 * p;
|
|
Packit |
67cb25 |
w->np[4] = 5.0;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* initialize dn' */
|
|
Packit |
67cb25 |
w->dnp[0] = 0.0;
|
|
Packit |
67cb25 |
w->dnp[1] = 0.5 * p;
|
|
Packit |
67cb25 |
w->dnp[2] = p;
|
|
Packit |
67cb25 |
w->dnp[3] = 0.5 * (1.0 + p);
|
|
Packit |
67cb25 |
w->dnp[4] = 1.0;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
w->n = 0;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
return GSL_SUCCESS;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
int
|
|
Packit |
67cb25 |
gsl_rstat_quantile_add(const double x, gsl_rstat_quantile_workspace *w)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
if (w->n < 5)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
w->q[w->n] = x;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
else
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
int i;
|
|
Packit |
67cb25 |
int k = -1;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
if (w->n == 5)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
/* initialization: sort the first five heights */
|
|
Packit |
67cb25 |
gsl_sort(w->q, 1, w->n);
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* step B1: find k such that q_k <= x < q_{k+1} */
|
|
Packit |
67cb25 |
if (x < w->q[0])
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
w->q[0] = x;
|
|
Packit |
67cb25 |
k = 0;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
else if (x >= w->q[4])
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
w->q[4] = x;
|
|
Packit |
67cb25 |
k = 3;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
else
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
for (i = 0; i <= 3; ++i)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
if (w->q[i] <= x && x < w->q[i + 1])
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
k = i;
|
|
Packit |
67cb25 |
break;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
if (k < 0)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
/* we could get here if x is nan */
|
|
Packit |
67cb25 |
GSL_ERROR ("invalid input argument x", GSL_EINVAL);
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* step B2(a): update n_i */
|
|
Packit |
67cb25 |
for (i = k + 1; i <= 4; ++i)
|
|
Packit |
67cb25 |
++(w->npos[i]);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* step B2(b): update n_i' */
|
|
Packit |
67cb25 |
for (i = 0; i < 5; ++i)
|
|
Packit |
67cb25 |
w->np[i] += w->dnp[i];
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
/* step B3: update heights */
|
|
Packit |
67cb25 |
for (i = 1; i <= 3; ++i)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
double ni = (double) w->npos[i];
|
|
Packit |
67cb25 |
double d = w->np[i] - ni;
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
if ((d >= 1.0 && (w->npos[i + 1] - w->npos[i] > 1)) ||
|
|
Packit |
67cb25 |
(d <= -1.0 && (w->npos[i - 1] - w->npos[i] < -1)))
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
int dsign = (d > 0.0) ? 1 : -1;
|
|
Packit |
67cb25 |
double qp1 = w->q[i + 1];
|
|
Packit |
67cb25 |
double qi = w->q[i];
|
|
Packit |
67cb25 |
double qm1 = w->q[i - 1];
|
|
Packit |
67cb25 |
double np1 = (double) w->npos[i + 1];
|
|
Packit |
67cb25 |
double nm1 = (double) w->npos[i - 1];
|
|
Packit |
67cb25 |
double qp = calc_psq(qp1, qi, qm1, (double) dsign,
|
|
Packit |
67cb25 |
np1, ni, nm1);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
if (qm1 < qp && qp < qp1)
|
|
Packit |
67cb25 |
w->q[i] = qp;
|
|
Packit |
67cb25 |
else
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
/* use linear formula */
|
|
Packit |
67cb25 |
w->q[i] += dsign * (w->q[i + dsign] - qi) / ((double) w->npos[i + dsign] - ni);
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
w->npos[i] += dsign;
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
++(w->n);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
return GSL_SUCCESS;
|
|
Packit |
67cb25 |
} /* gsl_rstat_quantile_add() */
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
double
|
|
Packit |
67cb25 |
gsl_rstat_quantile_get(gsl_rstat_quantile_workspace *w)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
if (w->n >= 5)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
return w->q[2];
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
else
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
/* not yet initialized */
|
|
Packit |
67cb25 |
gsl_sort(w->q, 1, w->n);
|
|
Packit |
67cb25 |
return gsl_stats_quantile_from_sorted_data(w->q, 1, w->n, w->p);
|
|
Packit |
67cb25 |
}
|
|
Packit |
67cb25 |
} /* gsl_rstat_quantile_get() */
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
static double
|
|
Packit |
67cb25 |
calc_psq(const double qp1, const double q, const double qm1,
|
|
Packit |
67cb25 |
const double d, const double np1, const double n, const double nm1)
|
|
Packit |
67cb25 |
{
|
|
Packit |
67cb25 |
double outer = d / (np1 - nm1);
|
|
Packit |
67cb25 |
double inner_left = (n - nm1 + d) * (qp1 - q) / (np1 - n);
|
|
Packit |
67cb25 |
double inner_right = (np1 - n - d) * (q - qm1) / (n - nm1);
|
|
Packit |
67cb25 |
|
|
Packit |
67cb25 |
return q + outer * (inner_left + inner_right);
|
|
Packit |
67cb25 |
} /* calc_psq() */
|