Blame rstat/test.c

Packit 67cb25
/* rstat/test.c
Packit 67cb25
 * 
Packit 67cb25
 * Copyright (C) 2015 Patrick Alken
Packit 67cb25
 * 
Packit 67cb25
 * This program is free software; you can redistribute it and/or modify
Packit 67cb25
 * it under the terms of the GNU General Public License as published by
Packit 67cb25
 * the Free Software Foundation; either version 3 of the License, or (at
Packit 67cb25
 * your option) any later version.
Packit 67cb25
 * 
Packit 67cb25
 * This program is distributed in the hope that it will be useful, but
Packit 67cb25
 * WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 67cb25
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 67cb25
 * General Public License for more details.
Packit 67cb25
 * 
Packit 67cb25
 * You should have received a copy of the GNU General Public License
Packit 67cb25
 * along with this program; if not, write to the Free Software
Packit 67cb25
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
Packit 67cb25
 */
Packit 67cb25
Packit 67cb25
#include <config.h>
Packit 67cb25
#include <stdlib.h>
Packit 67cb25
#include <math.h>
Packit 67cb25
#include <string.h>
Packit 67cb25
#include <gsl/gsl_math.h>
Packit 67cb25
#include <gsl/gsl_rstat.h>
Packit 67cb25
#include <gsl/gsl_sort.h>
Packit 67cb25
#include <gsl/gsl_statistics.h>
Packit 67cb25
#include <gsl/gsl_test.h>
Packit 67cb25
#include <gsl/gsl_rng.h>
Packit 67cb25
#include <gsl/gsl_randist.h>
Packit 67cb25
#include <gsl/gsl_ieee_utils.h>
Packit 67cb25
Packit 67cb25
double *
Packit 67cb25
random_data(const size_t n, gsl_rng *r)
Packit 67cb25
{
Packit 67cb25
  size_t i;
Packit 67cb25
  double *data = malloc(n * sizeof(double));
Packit 67cb25
Packit 67cb25
  for (i = 0; i < n; ++i)
Packit 67cb25
    data[i] = gsl_rng_uniform(r);
Packit 67cb25
Packit 67cb25
  return data;
Packit 67cb25
}
Packit 67cb25
Packit 67cb25
void
Packit 67cb25
test_basic(const size_t n, const double data[], const double tol)
Packit 67cb25
{
Packit 67cb25
  gsl_rstat_workspace *rstat_workspace_p = gsl_rstat_alloc();
Packit 67cb25
  const double expected_mean = gsl_stats_mean(data, 1, n);
Packit 67cb25
  const double expected_var = gsl_stats_variance(data, 1, n);
Packit 67cb25
  const double expected_sd = gsl_stats_sd(data, 1, n);
Packit 67cb25
  const double expected_sd_mean = expected_sd / sqrt((double) n);
Packit 67cb25
  const double expected_skew = gsl_stats_skew(data, 1, n);
Packit 67cb25
  const double expected_kurtosis = gsl_stats_kurtosis(data, 1, n);
Packit 67cb25
  double expected_rms = 0.0;
Packit 67cb25
  double mean, var, sd, sd_mean, rms, skew, kurtosis;
Packit 67cb25
  size_t i, num;
Packit 67cb25
  int status;
Packit 67cb25
Packit 67cb25
  /* compute expected rms */
Packit 67cb25
  for (i = 0; i < n; ++i)
Packit 67cb25
    expected_rms += data[i] * data[i];
Packit 67cb25
Packit 67cb25
  expected_rms = sqrt(expected_rms / n);
Packit 67cb25
Packit 67cb25
  /* add data to rstat workspace */
Packit 67cb25
  for (i = 0; i < n; ++i)
Packit 67cb25
    gsl_rstat_add(data[i], rstat_workspace_p);
Packit 67cb25
Packit 67cb25
  mean     = gsl_rstat_mean(rstat_workspace_p);
Packit 67cb25
  var      = gsl_rstat_variance(rstat_workspace_p);
Packit 67cb25
  sd       = gsl_rstat_sd(rstat_workspace_p);
Packit 67cb25
  sd_mean  = gsl_rstat_sd_mean(rstat_workspace_p);
Packit 67cb25
  rms      = gsl_rstat_rms(rstat_workspace_p);
Packit 67cb25
  skew     = gsl_rstat_skew(rstat_workspace_p);
Packit 67cb25
  kurtosis = gsl_rstat_kurtosis(rstat_workspace_p);
Packit 67cb25
  num      = gsl_rstat_n(rstat_workspace_p);
Packit 67cb25
Packit 67cb25
  gsl_test_int(num, n, "n n=%zu" , n);
Packit 67cb25
  gsl_test_rel(mean, expected_mean, tol, "mean n=%zu", n);
Packit 67cb25
  gsl_test_rel(var, expected_var, tol, "variance n=%zu", n);
Packit 67cb25
  gsl_test_rel(sd, expected_sd, tol, "stddev n=%zu", n);
Packit 67cb25
  gsl_test_rel(sd_mean, expected_sd_mean, tol, "stddev_mean n=%zu", n);
Packit 67cb25
  gsl_test_rel(rms, expected_rms, tol, "rms n=%zu", n);
Packit 67cb25
  gsl_test_rel(skew, expected_skew, tol, "skew n=%zu", n);
Packit 67cb25
  gsl_test_rel(kurtosis, expected_kurtosis, tol, "kurtosis n=%zu", n);
Packit 67cb25
Packit 67cb25
  status = gsl_rstat_reset(rstat_workspace_p);
Packit 67cb25
  gsl_test_int(status, GSL_SUCCESS, "rstat returned success");
Packit 67cb25
  num = gsl_rstat_n(rstat_workspace_p);
Packit 67cb25
Packit 67cb25
  gsl_test_int(num, 0, "n n=%zu" , n);
Packit 67cb25
Packit 67cb25
  gsl_rstat_free(rstat_workspace_p);
Packit 67cb25
}
Packit 67cb25
Packit 67cb25
void
Packit 67cb25
test_quantile(const double p, const double data[], const size_t n,
Packit 67cb25
              const double expected, const double tol, const char *desc)
Packit 67cb25
{
Packit 67cb25
  gsl_rstat_quantile_workspace *w = gsl_rstat_quantile_alloc(p);
Packit 67cb25
  double result;
Packit 67cb25
  size_t i;
Packit 67cb25
Packit 67cb25
  for (i = 0; i < n; ++i)
Packit 67cb25
    gsl_rstat_quantile_add(data[i], w);
Packit 67cb25
Packit 67cb25
  result = gsl_rstat_quantile_get(w);
Packit 67cb25
Packit 67cb25
  if (fabs(expected) < 1.0e-4)
Packit 67cb25
    gsl_test_abs(result, expected, tol, "%s p=%g", desc, p);
Packit 67cb25
  else
Packit 67cb25
    gsl_test_rel(result, expected, tol, "%s p=%g", desc, p);
Packit 67cb25
Packit 67cb25
  gsl_rstat_quantile_free(w);
Packit 67cb25
}
Packit 67cb25
Packit 67cb25
int
Packit 67cb25
main()
Packit 67cb25
{
Packit 67cb25
  gsl_rng *r = gsl_rng_alloc(gsl_rng_default);
Packit 67cb25
  const double tol1 = 1.0e-8;
Packit 67cb25
  const double tol2 = 1.0e-3;
Packit 67cb25
Packit 67cb25
  gsl_ieee_env_setup();
Packit 67cb25
Packit 67cb25
  {
Packit 67cb25
    const size_t N = 2000000;
Packit 67cb25
    double *data = random_data(N, r);
Packit 67cb25
    double data2[] = { 4.0, 7.0, 13.0, 16.0, -5.0 };
Packit 67cb25
    size_t i;
Packit 67cb25
Packit 67cb25
    test_basic(2, data, tol1);
Packit 67cb25
    test_basic(100, data, tol1);
Packit 67cb25
    test_basic(1000, data, tol1);
Packit 67cb25
    test_basic(10000, data, tol1);
Packit 67cb25
    test_basic(50000, data, tol1);
Packit 67cb25
    test_basic(80000, data, tol1);
Packit 67cb25
    test_basic(1500000, data, tol1);
Packit 67cb25
    test_basic(2000000, data, tol1);
Packit 67cb25
Packit 67cb25
    for (i = 0; i < 5; ++i)
Packit 67cb25
      data2[i] += 1.0e9;
Packit 67cb25
Packit 67cb25
    test_basic(5, data2, tol1);
Packit 67cb25
Packit 67cb25
    free(data);
Packit 67cb25
  }
Packit 67cb25
Packit 67cb25
  {
Packit 67cb25
    /* dataset from Jain and Chlamtac paper */
Packit 67cb25
    const size_t n_jain = 20;
Packit 67cb25
    const double data_jain[] = {  0.02,  0.15,  0.74,  3.39,  0.83,
Packit 67cb25
                                  22.37, 10.15, 15.43, 38.62, 15.92,
Packit 67cb25
                                  34.60, 10.28,  1.47,  0.40,  0.05,
Packit 67cb25
                                  11.39,  0.27,  0.42,  0.09, 11.37 };
Packit 67cb25
    double expected_jain = 4.44063435326;
Packit 67cb25
  
Packit 67cb25
    test_quantile(0.5, data_jain, n_jain, expected_jain, tol1, "jain");
Packit 67cb25
  }
Packit 67cb25
Packit 67cb25
  {
Packit 67cb25
    size_t n = 1000000;
Packit 67cb25
    double *data = malloc(n * sizeof(double));
Packit 67cb25
    double *sorted_data = malloc(n * sizeof(double));
Packit 67cb25
    gsl_rstat_workspace *rstat_workspace_p = gsl_rstat_alloc();
Packit 67cb25
    double p;
Packit 67cb25
    size_t i;
Packit 67cb25
Packit 67cb25
    for (i = 0; i < n; ++i)
Packit 67cb25
      {
Packit 67cb25
        data[i] = gsl_ran_gaussian_tail(r, 1.3, 1.0);
Packit 67cb25
        gsl_rstat_add(data[i], rstat_workspace_p);
Packit 67cb25
      }
Packit 67cb25
Packit 67cb25
    memcpy(sorted_data, data, n * sizeof(double));
Packit 67cb25
    gsl_sort(sorted_data, 1, n);
Packit 67cb25
Packit 67cb25
    /* test quantile calculation */
Packit 67cb25
    for (p = 0.1; p <= 0.9; p += 0.1)
Packit 67cb25
      {
Packit 67cb25
        double expected = gsl_stats_quantile_from_sorted_data(sorted_data, 1, n, p);
Packit 67cb25
        test_quantile(p, data, n, expected, tol2, "gauss");
Packit 67cb25
      }
Packit 67cb25
Packit 67cb25
    /* test mean, variance */
Packit 67cb25
    {
Packit 67cb25
      const double expected_mean = gsl_stats_mean(data, 1, n);
Packit 67cb25
      const double expected_var = gsl_stats_variance(data, 1, n);
Packit 67cb25
      const double expected_sd = gsl_stats_sd(data, 1, n);
Packit 67cb25
      const double expected_skew = gsl_stats_skew(data, 1, n);
Packit 67cb25
      const double expected_kurtosis = gsl_stats_kurtosis(data, 1, n);
Packit 67cb25
      const double expected_median = gsl_stats_quantile_from_sorted_data(sorted_data, 1, n, 0.5);
Packit 67cb25
Packit 67cb25
      const double mean = gsl_rstat_mean(rstat_workspace_p);
Packit 67cb25
      const double var = gsl_rstat_variance(rstat_workspace_p);
Packit 67cb25
      const double sd = gsl_rstat_sd(rstat_workspace_p);
Packit 67cb25
      const double skew = gsl_rstat_skew(rstat_workspace_p);
Packit 67cb25
      const double kurtosis = gsl_rstat_kurtosis(rstat_workspace_p);
Packit 67cb25
      const double median = gsl_rstat_median(rstat_workspace_p);
Packit 67cb25
Packit 67cb25
      gsl_test_rel(mean, expected_mean, tol1, "mean");
Packit 67cb25
      gsl_test_rel(var, expected_var, tol1, "variance");
Packit 67cb25
      gsl_test_rel(sd, expected_sd, tol1, "stddev");
Packit 67cb25
      gsl_test_rel(skew, expected_skew, tol1, "skew");
Packit 67cb25
      gsl_test_rel(kurtosis, expected_kurtosis, tol1, "kurtosis");
Packit 67cb25
      gsl_test_abs(median, expected_median, tol2, "median");
Packit 67cb25
    }
Packit 67cb25
Packit 67cb25
    free(data);
Packit 67cb25
    free(sorted_data);
Packit 67cb25
    gsl_rstat_free(rstat_workspace_p);
Packit 67cb25
  }
Packit 67cb25
Packit 67cb25
  gsl_rng_free(r);
Packit 67cb25
Packit 67cb25
  exit (gsl_test_summary());
Packit 67cb25
}