Blame tune/common.c

Packit 5c3484
/* Shared speed subroutines.
Packit 5c3484
Packit 5c3484
Copyright 1999-2006, 2008-2015 Free Software Foundation, Inc.
Packit 5c3484
Packit 5c3484
This file is part of the GNU MP Library.
Packit 5c3484
Packit 5c3484
The GNU MP Library is free software; you can redistribute it and/or modify
Packit 5c3484
it under the terms of either:
Packit 5c3484
Packit 5c3484
  * the GNU Lesser General Public License as published by the Free
Packit 5c3484
    Software Foundation; either version 3 of the License, or (at your
Packit 5c3484
    option) any later version.
Packit 5c3484
Packit 5c3484
or
Packit 5c3484
Packit 5c3484
  * the GNU General Public License as published by the Free Software
Packit 5c3484
    Foundation; either version 2 of the License, or (at your option) any
Packit 5c3484
    later version.
Packit 5c3484
Packit 5c3484
or both in parallel, as here.
Packit 5c3484
Packit 5c3484
The GNU MP Library is distributed in the hope that it will be useful, but
Packit 5c3484
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
Packit 5c3484
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
Packit 5c3484
for more details.
Packit 5c3484
Packit 5c3484
You should have received copies of the GNU General Public License and the
Packit 5c3484
GNU Lesser General Public License along with the GNU MP Library.  If not,
Packit 5c3484
see https://www.gnu.org/licenses/.  */
Packit 5c3484
Packit 5c3484
#define __GMP_NO_ATTRIBUTE_CONST_PURE
Packit 5c3484
Packit 5c3484
#include <errno.h>
Packit 5c3484
#include <fcntl.h>
Packit 5c3484
#include <math.h>
Packit 5c3484
#include <stdio.h>
Packit 5c3484
#include <stdlib.h> /* for qsort */
Packit 5c3484
#include <string.h>
Packit 5c3484
#include <unistd.h>
Packit 5c3484
#if 0
Packit 5c3484
#include <sys/ioctl.h>
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
#include "gmp.h"
Packit 5c3484
#include "gmp-impl.h"
Packit 5c3484
#include "longlong.h"
Packit 5c3484
Packit 5c3484
#include "tests.h"
Packit 5c3484
#include "speed.h"
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Flags set by speed_option_set() from "-o" options; all default to off.  */

/* "addrs": speed_cache_fill() prints operand addresses when they change.  */
int speed_option_addrs = 0;

/* "verbose" (incremented) or "verbose=N" (assigned); speed_measure() prints
   every attempt once this is 3 or more.  */
int speed_option_verbose = 0;

/* "cycles-broken".  */
int speed_option_cycles_broken = 0;
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Provide __clz_tab even if it's not required, for the benefit of new code
Packit 5c3484
   being tested with many.pl. */
Packit 5c3484
#ifndef COUNT_LEADING_ZEROS_NEED_CLZ_TAB
Packit 5c3484
#define COUNT_LEADING_ZEROS_NEED_CLZ_TAB
Packit 5c3484
#include "mp_clz_tab.c"
Packit 5c3484
#undef COUNT_LEADING_ZEROS_NEED_CLZ_TAB
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Hook called by speed_cache_fill() when s->cache is 1.  Presumably meant
   to write back and invalidate the CPU cache (cf the x86 WBINVD
   instruction), but both candidate implementations below are compiled out
   with "#if 0", so as built this function does nothing.  */
void
pentium_wbinvd (void)
{
  /* Disabled: issue an ioctl on a /dev/wbinvd device, opened on first use.  */
#if 0
  {
    static int  wbinvd_fd = -2;   /* -2 not tried yet, -1 open failed */

    if (wbinvd_fd == -2)
      {
        wbinvd_fd = open ("/dev/wbinvd", O_RDWR);
        if (wbinvd_fd == -1)
          perror ("open /dev/wbinvd");
      }

    if (wbinvd_fd != -1)
      ioctl (wbinvd_fd, 0, 0);
  }
#endif

  /* Disabled: read through a WBINVDSIZE byte buffer, allocated on first
     use, handing the byte sum to mpn_cache_fill_dummy().  */
#if 0
#define WBINVDSIZE  1024*1024*2
  {
    static char  *buf = NULL;
    int   k, total;

    if (buf == NULL)
      buf = malloc (WBINVDSIZE);

#if 0
    for (k = 0; k < WBINVDSIZE; k++)
      buf[k] = k & 0xFF;
#endif

    total = 0;
    for (k = 0; k < WBINVDSIZE; k++)
      total += buf[k];

    mpn_cache_fill_dummy (total);
  }
#endif
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Three-way comparison of the doubles P and Q point at: 1 if *p > *q,
   -1 if *p < *q, otherwise 0.  speed_measure() hands this to qsort()
   through a qsort_function_t cast.  */
int
double_cmp_ptr (const double *p, const double *q)
{
  const double  lhs = *p;
  const double  rhs = *q;

  /* Each comparison yields 0 or 1, so the difference is -1, 0 or 1.  */
  return (lhs > rhs) - (lhs < rhs);
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Measure the speed of a given routine.
Packit 5c3484
Packit 5c3484
   The routine is run with enough repetitions to make it take at least
Packit 5c3484
   speed_precision * speed_unittime.  This aims to minimize the effects of a
Packit 5c3484
   limited accuracy time base and the overhead of the measuring itself.
Packit 5c3484
Packit 5c3484
   Measurements are made looking for 4 results within TOLERANCE of each
Packit 5c3484
   other (or 3 for routines taking longer than 2 seconds).  This aims to get
Packit 5c3484
   an accurate reading even if some runs are bloated by interrupts or task
Packit 5c3484
   switches or whatever.
Packit 5c3484
Packit 5c3484
   The given (*fun)() is expected to run its function "s->reps" many times
Packit 5c3484
   and return the total elapsed time measured using speed_starttime() and
Packit 5c3484
   speed_endtime().  If the function doesn't support the given s->size or
Packit 5c3484
   s->r, -1.0 should be returned.  See the various base routines below.  */
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_measure (double (*fun) (struct speed_params *s), struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
#define TOLERANCE    1.01  /* 1% */
Packit 5c3484
  const int max_zeros = 10;
Packit 5c3484
Packit 5c3484
  struct speed_params  s_dummy;
Packit 5c3484
  int     i, j, e;
Packit 5c3484
  double  t[30];
Packit 5c3484
  double  t_unsorted[30];
Packit 5c3484
  double  reps_d;
Packit 5c3484
  int     zeros = 0;
Packit 5c3484
Packit 5c3484
  /* Use dummy parameters if caller doesn't provide any.  Only a few special
Packit 5c3484
     "fun"s will cope with this, speed_noop() is one.  */
Packit 5c3484
  if (s == NULL)
Packit 5c3484
    {
Packit 5c3484
      memset (&s_dummy, '\0', sizeof (s_dummy));
Packit 5c3484
      s = &s_dummy;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  s->reps = 1;
Packit 5c3484
  s->time_divisor = 1.0;
Packit 5c3484
  for (i = 0; i < numberof (t); i++)
Packit 5c3484
    {
Packit 5c3484
      for (;;)
Packit 5c3484
	{
Packit 5c3484
	  s->src_num = 0;
Packit 5c3484
	  s->dst_num = 0;
Packit 5c3484
Packit 5c3484
	  t[i] = (*fun) (s);
Packit 5c3484
Packit 5c3484
	  if (speed_option_verbose >= 3)
Packit 5c3484
	    gmp_printf("size=%ld reps=%u r=%Md attempt=%d  %.9f\n",
Packit 5c3484
		       (long) s->size, s->reps, s->r, i, t[i]);
Packit 5c3484
Packit 5c3484
	  if (t[i] == 0.0)
Packit 5c3484
	    {
Packit 5c3484
	      zeros++;
Packit 5c3484
	      if (zeros > max_zeros)
Packit 5c3484
		{
Packit 5c3484
		  fprintf (stderr, "Fatal error: too many (%d) failed measurements (0.0)\n", zeros);
Packit 5c3484
		  abort ();
Packit 5c3484
		}
Packit 5c3484
	     if (s->reps < 10000)
Packit 5c3484
	       s->reps *= 2;
Packit 5c3484
Packit 5c3484
	      continue;
Packit 5c3484
	    }
Packit 5c3484
Packit 5c3484
	  if (t[i] == -1.0)
Packit 5c3484
	    return -1.0;
Packit 5c3484
Packit 5c3484
	  if (t[i] >= speed_unittime * speed_precision)
Packit 5c3484
	    break;
Packit 5c3484
Packit 5c3484
	  /* go to a value of reps to make t[i] >= precision */
Packit 5c3484
	  reps_d = ceil (1.1 * s->reps
Packit 5c3484
			 * speed_unittime * speed_precision
Packit 5c3484
			 / MAX (t[i], speed_unittime));
Packit 5c3484
	  if (reps_d > 2e9 || reps_d < 1.0)
Packit 5c3484
	    {
Packit 5c3484
	      fprintf (stderr, "Fatal error: new reps bad: %.2f\n", reps_d);
Packit 5c3484
	      fprintf (stderr, "  (old reps %u, unittime %.4g, precision %d, t[i] %.4g)\n",
Packit 5c3484
		       s->reps, speed_unittime, speed_precision, t[i]);
Packit 5c3484
	      abort ();
Packit 5c3484
	    }
Packit 5c3484
	  s->reps = (unsigned) reps_d;
Packit 5c3484
	}
Packit 5c3484
      t[i] /= s->reps;
Packit 5c3484
      t_unsorted[i] = t[i];
Packit 5c3484
Packit 5c3484
      if (speed_precision == 0)
Packit 5c3484
	return t[i];
Packit 5c3484
Packit 5c3484
      /* require 3 values within TOLERANCE when >= 2 secs, 4 when below */
Packit 5c3484
      if (t[0] >= 2.0)
Packit 5c3484
	e = 3;
Packit 5c3484
      else
Packit 5c3484
	e = 4;
Packit 5c3484
Packit 5c3484
      /* Look for e many t[]'s within TOLERANCE of each other to consider a
Packit 5c3484
	 valid measurement.  Return smallest among them.  */
Packit 5c3484
      if (i >= e)
Packit 5c3484
	{
Packit 5c3484
	  qsort (t, i+1, sizeof(t[0]), (qsort_function_t) double_cmp_ptr);
Packit 5c3484
	  for (j = e-1; j < i; j++)
Packit 5c3484
	    if (t[j] <= t[j-e+1] * TOLERANCE)
Packit 5c3484
	      return t[j-e+1] / s->time_divisor;
Packit 5c3484
	}
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  fprintf (stderr, "speed_measure() could not get %d results within %.1f%%\n",
Packit 5c3484
	   e, (TOLERANCE-1.0)*100.0);
Packit 5c3484
  fprintf (stderr, "    unsorted         sorted\n");
Packit 5c3484
  fprintf (stderr, "  %.12f    %.12f    is about 0.5%%\n",
Packit 5c3484
	   t_unsorted[0]*(TOLERANCE-1.0), t[0]*(TOLERANCE-1.0));
Packit 5c3484
  for (i = 0; i < numberof (t); i++)
Packit 5c3484
    fprintf (stderr, "  %.09f       %.09f\n", t_unsorted[i], t[i]);
Packit 5c3484
Packit 5c3484
  return -1.0;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Read all of ptr,size to get it into the CPU memory cache.
Packit 5c3484
Packit 5c3484
   A call to mpn_cache_fill_dummy() is used to make sure the compiler
Packit 5c3484
   doesn't optimize away the whole loop.  Using "volatile mp_limb_t sum"
Packit 5c3484
   would work too, but the function call means we don't rely on every
Packit 5c3484
   compiler actually implementing volatile properly.
Packit 5c3484
Packit 5c3484
   mpn_cache_fill_dummy() is in a separate source file to stop gcc thinking
Packit 5c3484
   it can inline it.  */
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
mpn_cache_fill (mp_srcptr ptr, mp_size_t size)
Packit 5c3484
{
Packit 5c3484
  mp_limb_t  sum = 0;
Packit 5c3484
  mp_size_t  i;
Packit 5c3484
Packit 5c3484
  for (i = 0; i < size; i++)
Packit 5c3484
    sum += ptr[i];
Packit 5c3484
Packit 5c3484
  mpn_cache_fill_dummy(sum);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
mpn_cache_fill_write (mp_ptr ptr, mp_size_t size)
Packit 5c3484
{
Packit 5c3484
  mpn_cache_fill (ptr, size);
Packit 5c3484
Packit 5c3484
#if 0
Packit 5c3484
  mpn_random (ptr, size);
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
#if 0
Packit 5c3484
  mp_size_t  i;
Packit 5c3484
Packit 5c3484
  for (i = 0; i < size; i++)
Packit 5c3484
    ptr[i] = i;
Packit 5c3484
#endif
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
speed_operand_src (struct speed_params *s, mp_ptr ptr, mp_size_t size)
Packit 5c3484
{
Packit 5c3484
  if (s->src_num >= numberof (s->src))
Packit 5c3484
    {
Packit 5c3484
      fprintf (stderr, "speed_operand_src: no room left in s->src[]\n");
Packit 5c3484
      abort ();
Packit 5c3484
    }
Packit 5c3484
  s->src[s->src_num].ptr = ptr;
Packit 5c3484
  s->src[s->src_num].size = size;
Packit 5c3484
  s->src_num++;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
speed_operand_dst (struct speed_params *s, mp_ptr ptr, mp_size_t size)
Packit 5c3484
{
Packit 5c3484
  if (s->dst_num >= numberof (s->dst))
Packit 5c3484
    {
Packit 5c3484
      fprintf (stderr, "speed_operand_dst: no room left in s->dst[]\n");
Packit 5c3484
      abort ();
Packit 5c3484
    }
Packit 5c3484
  s->dst[s->dst_num].ptr = ptr;
Packit 5c3484
  s->dst[s->dst_num].size = size;
Packit 5c3484
  s->dst_num++;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
speed_cache_fill (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  static struct speed_params  prev;
Packit 5c3484
  int  i;
Packit 5c3484
Packit 5c3484
  /* FIXME: need a better way to get the format string for a pointer */
Packit 5c3484
Packit 5c3484
  if (speed_option_addrs)
Packit 5c3484
    {
Packit 5c3484
      int  different;
Packit 5c3484
Packit 5c3484
      different = (s->dst_num != prev.dst_num || s->src_num != prev.src_num);
Packit 5c3484
      for (i = 0; i < s->dst_num; i++)
Packit 5c3484
	different |= (s->dst[i].ptr != prev.dst[i].ptr);
Packit 5c3484
      for (i = 0; i < s->src_num; i++)
Packit 5c3484
	different |= (s->src[i].ptr != prev.src[i].ptr);
Packit 5c3484
Packit 5c3484
      if (different)
Packit 5c3484
	{
Packit 5c3484
	  if (s->dst_num != 0)
Packit 5c3484
	    {
Packit 5c3484
	      printf ("dst");
Packit 5c3484
	      for (i = 0; i < s->dst_num; i++)
Packit 5c3484
		printf (" %08lX", (unsigned long) s->dst[i].ptr);
Packit 5c3484
	      printf (" ");
Packit 5c3484
	    }
Packit 5c3484
Packit 5c3484
	  if (s->src_num != 0)
Packit 5c3484
	    {
Packit 5c3484
	      printf ("src");
Packit 5c3484
	      for (i = 0; i < s->src_num; i++)
Packit 5c3484
		printf (" %08lX", (unsigned long) s->src[i].ptr);
Packit 5c3484
	      printf (" ");
Packit 5c3484
	    }
Packit 5c3484
	  printf ("  (cf sp approx %08lX)\n", (unsigned long) &different);
Packit 5c3484
Packit 5c3484
	}
Packit 5c3484
Packit 5c3484
      memcpy (&prev, s, sizeof(prev));
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  switch (s->cache) {
Packit 5c3484
  case 0:
Packit 5c3484
    for (i = 0; i < s->dst_num; i++)
Packit 5c3484
      mpn_cache_fill_write (s->dst[i].ptr, s->dst[i].size);
Packit 5c3484
    for (i = 0; i < s->src_num; i++)
Packit 5c3484
      mpn_cache_fill (s->src[i].ptr, s->src[i].size);
Packit 5c3484
    break;
Packit 5c3484
  case 1:
Packit 5c3484
    pentium_wbinvd();
Packit 5c3484
    break;
Packit 5c3484
  }
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Miscellaneous options accepted by tune and speed programs under -o. */
Packit 5c3484
Packit 5c3484
void
Packit 5c3484
speed_option_set (const char *s)
Packit 5c3484
{
Packit 5c3484
  int  n;
Packit 5c3484
Packit 5c3484
  if (strcmp (s, "addrs") == 0)
Packit 5c3484
    {
Packit 5c3484
      speed_option_addrs = 1;
Packit 5c3484
    }
Packit 5c3484
  else if (strcmp (s, "verbose") == 0)
Packit 5c3484
    {
Packit 5c3484
      speed_option_verbose++;
Packit 5c3484
    }
Packit 5c3484
  else if (sscanf (s, "verbose=%d", &n) == 1)
Packit 5c3484
    {
Packit 5c3484
      speed_option_verbose = n;
Packit 5c3484
    }
Packit 5c3484
  else if (strcmp (s, "cycles-broken") == 0)
Packit 5c3484
    {
Packit 5c3484
      speed_option_cycles_broken = 1;
Packit 5c3484
    }
Packit 5c3484
  else
Packit 5c3484
    {
Packit 5c3484
      printf ("Unrecognised -o option: %s\n", s);
Packit 5c3484
      exit (1);
Packit 5c3484
    }
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* The following are basic speed running routines for various gmp functions.
Packit 5c3484
   Many are very similar and use speed.h macros.
Packit 5c3484
Packit 5c3484
   Each routine allocates its own destination space for the result of the
Packit 5c3484
   function, because only it can know what the function needs.
Packit 5c3484
Packit 5c3484
   speed_starttime() and speed_endtime() are put tight around the code to be
Packit 5c3484
   measured.  Any setups are done outside the timed portion.
Packit 5c3484
Packit 5c3484
   Each routine is responsible for its own cache priming.
Packit 5c3484
   speed_cache_fill() is a good way to do this, see examples in speed.h.
Packit 5c3484
   One cache priming possibility, for CPUs with write-allocate cache, and
Packit 5c3484
   functions that don't take too long, is to do one dummy call before timing
Packit 5c3484
   so as to cache everything that gets used.  But speed_measure() runs a
Packit 5c3484
   routine at least twice and will take the smaller time, so this might not
Packit 5c3484
   be necessary.
Packit 5c3484
Packit 5c3484
   Data alignment will be important, for source, destination and temporary
Packit 5c3484
   workspace.  A routine can align its destination and workspace.  Programs
Packit 5c3484
   using the routines will ensure s->xp and s->yp are aligned.  Aligning
Packit 5c3484
   onto a CACHE_LINE_SIZE boundary is suggested.  s->align_wp and
Packit 5c3484
   s->align_wp2 should be respected where it makes sense to do so.
Packit 5c3484
   SPEED_TMP_ALLOC_LIMBS is a good way to do this.
Packit 5c3484
Packit 5c3484
   A loop of the following form can be expected to turn into good assembler
Packit 5c3484
   code on most CPUs, thereby minimizing overhead in the measurement.  It
Packit 5c3484
   can always be assumed s->reps >= 1.
Packit 5c3484
Packit 5c3484
	  i = s->reps
Packit 5c3484
	  do
Packit 5c3484
	    foo();
Packit 5c3484
	  while (--i != 0);
Packit 5c3484
Packit 5c3484
   Additional parameters might be added to "struct speed_params" in the
Packit 5c3484
   future.  Routines should ignore anything they don't use.
Packit 5c3484
Packit 5c3484
   s->size can be used creatively, and s->xp and s->yp can be ignored.  For
Packit 5c3484
   example, speed_mpz_fac_ui() uses s->size as n for the factorial.  s->r is
Packit 5c3484
   just a user-supplied parameter.  speed_mpn_lshift() uses it as a shift,
Packit 5c3484
   speed_mpn_mul_1() uses it as a multiplier.  */
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* MPN_COPY etc can be macros, so the _CALL forms are necessary */
Packit 5c3484
double
Packit 5c3484
speed_MPN_COPY (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (MPN_COPY);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_MPN_COPY_INCR (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (MPN_COPY_INCR);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_MPN_COPY_DECR (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (MPN_COPY_DECR);
Packit 5c3484
}
Packit 5c3484
#if HAVE_NATIVE_mpn_copyi
Packit 5c3484
double
Packit 5c3484
speed_mpn_copyi (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (mpn_copyi);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
#if HAVE_NATIVE_mpn_copyd
Packit 5c3484
double
Packit 5c3484
speed_mpn_copyd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (mpn_copyd);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
double
Packit 5c3484
speed_memcpy (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY_BYTES (memcpy);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_com (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (mpn_com);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_neg (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (mpn_neg);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sec_tabselect (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TABSELECT (mpn_sec_tabselect);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_addmul_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_addmul_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_submul_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_submul_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* mpn_addmul_N for N = 2..8.  Each is compiled only when the matching
   HAVE_NATIVE_mpn_addmul_N is set, and is timed through the
   SPEED_ROUTINE_MPN_UNARY_N macro with the same N.  */

#if HAVE_NATIVE_mpn_addmul_2
double
speed_mpn_addmul_2 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_2 (mpn_addmul_2);
}
#endif

#if HAVE_NATIVE_mpn_addmul_3
double
speed_mpn_addmul_3 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_3 (mpn_addmul_3);
}
#endif

#if HAVE_NATIVE_mpn_addmul_4
double
speed_mpn_addmul_4 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_4 (mpn_addmul_4);
}
#endif

#if HAVE_NATIVE_mpn_addmul_5
double
speed_mpn_addmul_5 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_5 (mpn_addmul_5);
}
#endif

#if HAVE_NATIVE_mpn_addmul_6
double
speed_mpn_addmul_6 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_6 (mpn_addmul_6);
}
#endif

#if HAVE_NATIVE_mpn_addmul_7
double
speed_mpn_addmul_7 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_7 (mpn_addmul_7);
}
#endif

#if HAVE_NATIVE_mpn_addmul_8
double
speed_mpn_addmul_8 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_8 (mpn_addmul_8);
}
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_mul_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_1_inplace (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1_INPLACE (mpn_mul_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* mpn_mul_N for N = 2..6.  Each is compiled only when the matching
   HAVE_NATIVE_mpn_mul_N is set, and is timed through the
   SPEED_ROUTINE_MPN_UNARY_N macro with the same N.  */

#if HAVE_NATIVE_mpn_mul_2
double
speed_mpn_mul_2 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_2 (mpn_mul_2);
}
#endif

#if HAVE_NATIVE_mpn_mul_3
double
speed_mpn_mul_3 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_3 (mpn_mul_3);
}
#endif

#if HAVE_NATIVE_mpn_mul_4
double
speed_mpn_mul_4 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_4 (mpn_mul_4);
}
#endif

#if HAVE_NATIVE_mpn_mul_5
double
speed_mpn_mul_5 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_5 (mpn_mul_5);
}
#endif

#if HAVE_NATIVE_mpn_mul_6
double
speed_mpn_mul_6 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_6 (mpn_mul_6);
}
#endif
Packit 5c3484
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_lshift (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_lshift);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_lshiftc (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_lshiftc);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_rshift (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_rshift);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* The carry-in variants (if available) are good for measuring because they
   won't skip a division if high<divisor.  Alternately, use -1 as a divisor
   with the plain _1 forms. */
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1 (mpn_divrem_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1f (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1F (mpn_divrem_1);
Packit 5c3484
}
Packit 5c3484
#if HAVE_NATIVE_mpn_divrem_1c
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1c (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1C (mpn_divrem_1c);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1cf (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1CF (mpn_divrem_1c);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1_div (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1 (mpn_divrem_1_div);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1f_div (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1F (mpn_divrem_1_div);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1_inv (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1 (mpn_divrem_1_inv);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_1f_inv (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_1F (mpn_divrem_1_inv);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_div (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1 (mpn_mod_1_div);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_inv (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1 (mpn_mod_1_inv);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_preinv_divrem_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PREINV_DIVREM_1 (mpn_preinv_divrem_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_preinv_divrem_1f (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PREINV_DIVREM_1F (mpn_preinv_divrem_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
#if GMP_NUMB_BITS % 4 == 0
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_34lsub1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_34LSUB1 (mpn_mod_34lsub1);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_2 (mpn_divrem_2);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_2_div (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_2 (mpn_divrem_2_div);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_divrem_2_inv (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVREM_2 (mpn_divrem_2_inv);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_1n_pi1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_1N_PI1 (mpn_div_qr_1n_pi1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_1n_pi1_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_1N_PI1 (mpn_div_qr_1n_pi1_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_1n_pi1_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_1N_PI1 (mpn_div_qr_1n_pi1_2);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_1 (mpn_div_qr_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_2n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_2 (mpn_div_qr_2, 1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_div_qr_2u (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIV_QR_2 (mpn_div_qr_2, 0);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1 (mpn_mod_1);
Packit 5c3484
}
Packit 5c3484
#if HAVE_NATIVE_mpn_mod_1c
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1c (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1C (mpn_mod_1c);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
double
Packit 5c3484
speed_mpn_preinv_mod_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PREINV_MOD_1 (mpn_preinv_mod_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_1 (mpn_mod_1_1p,mpn_mod_1_1p_cps);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_1_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_1 (mpn_mod_1_1p_1,mpn_mod_1_1p_cps_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_1_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_1 (mpn_mod_1_1p_2,mpn_mod_1_1p_cps_2);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_N (mpn_mod_1s_2p,mpn_mod_1s_2p_cps,2);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_3 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_N (mpn_mod_1s_3p,mpn_mod_1s_3p_cps,3);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mod_1_4 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MOD_1_N (mpn_mod_1s_4p,mpn_mod_1s_4p_cps,4);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_divexact_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_DIVEXACT_1 (mpn_divexact_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_divexact_by3 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_COPY (mpn_divexact_by3);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_bdiv_dbm1c (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BDIV_DBM1C (mpn_bdiv_dbm1c);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_bdiv_q_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BDIV_Q_1 (mpn_bdiv_q_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_pi1_bdiv_q_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_BDIV_Q_1 (mpn_pi1_bdiv_q_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
#if HAVE_NATIVE_mpn_modexact_1_odd
Packit 5c3484
double
Packit 5c3484
speed_mpn_modexact_1_odd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MODEXACT_1_ODD (mpn_modexact_1_odd);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_modexact_1c_odd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MODEXACT_1C_ODD (mpn_modexact_1c_odd);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpz_mod (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_MOD (mpz_mod);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_sbpi1_div_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_DIV (mpn_sbpi1_div_qr, inv.inv32, 2,0);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_dcpi1_div_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_DIV (mpn_dcpi1_div_qr, &inv, 6,3);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sbpi1_divappr_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_DIV (mpn_sbpi1_divappr_q, inv.inv32, 2,0);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_dcpi1_divappr_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_DIV (mpn_dcpi1_divappr_q, &inv, 6,3);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mu_div_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MU_DIV_QR (mpn_mu_div_qr, mpn_mu_div_qr_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mu_divappr_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MU_DIV_Q (mpn_mu_divappr_q, mpn_mu_divappr_q_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mu_div_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MU_DIV_Q (mpn_mu_div_q, mpn_mu_div_q_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mupi_div_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUPI_DIV_QR (mpn_preinv_mu_div_qr, mpn_preinv_mu_div_qr_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_sbpi1_bdiv_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_BDIV_QR (mpn_sbpi1_bdiv_qr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_dcpi1_bdiv_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_BDIV_QR (mpn_dcpi1_bdiv_qr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sbpi1_bdiv_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_BDIV_Q (mpn_sbpi1_bdiv_q);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_dcpi1_bdiv_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_PI1_BDIV_Q (mpn_dcpi1_bdiv_q);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mu_bdiv_q (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MU_BDIV_Q (mpn_mu_bdiv_q, mpn_mu_bdiv_q_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mu_bdiv_qr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MU_BDIV_QR (mpn_mu_bdiv_qr, mpn_mu_bdiv_qr_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_broot (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BROOT (mpn_broot);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_broot_invm1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BROOT (mpn_broot_invm1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_brootinv (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BROOTINV (mpn_brootinv, 5*s->size);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_binvert (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINVERT (mpn_binvert, mpn_binvert_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_invert (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_INVERT (mpn_invert, mpn_invert_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_invertappr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_INVERTAPPR (mpn_invertappr, mpn_invertappr_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_ni_invertappr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_INVERTAPPR (mpn_ni_invertappr, mpn_invertappr_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_sec_invert (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SEC_INVERT (mpn_sec_invert, mpn_sec_invert_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_redc_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_REDC_1 (mpn_redc_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_redc_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_REDC_2 (mpn_redc_2);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_redc_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_REDC_N (mpn_redc_n);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_popcount (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_POPCOUNT (mpn_popcount);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_hamdist (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HAMDIST (mpn_hamdist);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N (mpn_add_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
SPEED_ROUTINE_MPN_BINARY_N (mpn_sub_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_add_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_1_inplace (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1_INPLACE (mpn_add_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1 (mpn_sub_1);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_1_inplace (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_UNARY_1_INPLACE (mpn_sub_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_err1_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR1_N (mpn_add_err1_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_err1_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR1_N (mpn_sub_err1_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_err2_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR2_N (mpn_add_err2_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_err2_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR2_N (mpn_sub_err2_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_add_err3_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR3_N (mpn_add_err3_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sub_err3_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_ERR3_N (mpn_sub_err3_n);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed wrapper for mpn_add_n_sub_n, compiled only when
   HAVE_NATIVE_mpn_add_n_sub_n is set.  The call expression is handed to
   SPEED_ROUTINE_MPN_ADDSUB_N_CALL (defined outside this section), which is
   expected to supply the timing loop and return value; `ap' and `sp' are
   not declared here and are presumably locals provided by that macro.  */
#if HAVE_NATIVE_mpn_add_n_sub_n
double
speed_mpn_add_n_sub_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_ADDSUB_N_CALL
    (mpn_add_n_sub_n (ap, sp, s->xp, s->yp, s->size));
}
#endif
Packit 5c3484
Packit 5c3484
/* Speed wrappers for the shift-by-1 add/sub/rsb routines, each compiled
   only under its own HAVE_NATIVE_* test.  Note the three-operand forms
   test `== 1' while the _ip1/_ip2 forms test for any non-zero value; keep
   those conditions exactly as they are.  Each body is one SPEED_ROUTINE_*
   macro invocation; the macro (defined outside this section) is expected
   to supply the timing loop and the return value.  */
#if HAVE_NATIVE_mpn_addlsh1_n == 1
double
speed_mpn_addlsh1_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_addlsh1_n);
}
#endif

#if HAVE_NATIVE_mpn_sublsh1_n == 1
double
speed_mpn_sublsh1_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_sublsh1_n);
}
#endif

#if HAVE_NATIVE_mpn_addlsh1_n_ip1
double
speed_mpn_addlsh1_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_addlsh1_n_ip1);
}
#endif

#if HAVE_NATIVE_mpn_addlsh1_n_ip2
double
speed_mpn_addlsh1_n_ip2 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_addlsh1_n_ip2);
}
#endif

#if HAVE_NATIVE_mpn_sublsh1_n_ip1
double
speed_mpn_sublsh1_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_sublsh1_n_ip1);
}
#endif

#if HAVE_NATIVE_mpn_rsblsh1_n == 1
double
speed_mpn_rsblsh1_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_rsblsh1_n);
}
#endif
Packit 5c3484
/* Speed wrappers for the shift-by-2 add/sub/rsb routines, each compiled
   only under its own HAVE_NATIVE_* test.  Note the three-operand forms
   test `== 1' while the _ip1/_ip2 forms test for any non-zero value; keep
   those conditions exactly as they are.  Each body is one SPEED_ROUTINE_*
   macro invocation; the macro (defined outside this section) is expected
   to supply the timing loop and the return value.  */
#if HAVE_NATIVE_mpn_addlsh2_n == 1
double
speed_mpn_addlsh2_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_addlsh2_n);
}
#endif

#if HAVE_NATIVE_mpn_sublsh2_n == 1
double
speed_mpn_sublsh2_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_sublsh2_n);
}
#endif

#if HAVE_NATIVE_mpn_addlsh2_n_ip1
double
speed_mpn_addlsh2_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_addlsh2_n_ip1);
}
#endif

#if HAVE_NATIVE_mpn_addlsh2_n_ip2
double
speed_mpn_addlsh2_n_ip2 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_addlsh2_n_ip2);
}
#endif

#if HAVE_NATIVE_mpn_sublsh2_n_ip1
double
speed_mpn_sublsh2_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_COPY (mpn_sublsh2_n_ip1);
}
#endif

#if HAVE_NATIVE_mpn_rsblsh2_n == 1
double
speed_mpn_rsblsh2_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_rsblsh2_n);
}
#endif
Packit 5c3484
/* Speed wrappers for the general-shift add/sub/rsb routines, each compiled
   only when the matching HAVE_NATIVE_* symbol is set.  The call expression
   is handed to a SPEED_ROUTINE_*_CALL macro (defined outside this section),
   which is expected to supply the timing loop and return value; wp, xp and
   yp are not declared here and are presumably locals of those macros.  The
   final argument 7 is a fixed constant, presumably the shift count.  */
#if HAVE_NATIVE_mpn_addlsh_n
double
speed_mpn_addlsh_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_addlsh_n (wp, xp, yp, s->size, 7));
}
#endif

#if HAVE_NATIVE_mpn_sublsh_n
double
speed_mpn_sublsh_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_sublsh_n (wp, xp, yp, s->size, 7));
}
#endif

#if HAVE_NATIVE_mpn_addlsh_n_ip1
double
speed_mpn_addlsh_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_1_CALL (mpn_addlsh_n_ip1 (wp, s->xp, s->size, 7));
}
#endif

#if HAVE_NATIVE_mpn_addlsh_n_ip2
double
speed_mpn_addlsh_n_ip2 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_1_CALL (mpn_addlsh_n_ip2 (wp, s->xp, s->size, 7));
}
#endif

#if HAVE_NATIVE_mpn_sublsh_n_ip1
double
speed_mpn_sublsh_n_ip1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_UNARY_1_CALL (mpn_sublsh_n_ip1 (wp, s->xp, s->size, 7));
}
#endif

#if HAVE_NATIVE_mpn_rsblsh_n
double
speed_mpn_rsblsh_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_rsblsh_n (wp, xp, yp, s->size, 7));
}
#endif
Packit 5c3484
/* Speed wrappers for mpn_rsh1add_n and mpn_rsh1sub_n, each compiled only
   when the matching HAVE_NATIVE_* symbol is set.  Each body is one
   SPEED_ROUTINE_MPN_BINARY_N invocation; that macro (defined outside this
   section) is expected to supply the timing loop and the return value.  */
#if HAVE_NATIVE_mpn_rsh1add_n
double
speed_mpn_rsh1add_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_rsh1add_n);
}
#endif

#if HAVE_NATIVE_mpn_rsh1sub_n
double
speed_mpn_rsh1sub_n (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_BINARY_N (mpn_rsh1sub_n);
}
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_cnd_add_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_cnd_add_n (1, wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_cnd_sub_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_cnd_sub_n (1, wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* mpn_and_n etc can be macros and so have to be handled with
Packit 5c3484
   SPEED_ROUTINE_MPN_BINARY_N_CALL forms */
Packit 5c3484
double
Packit 5c3484
speed_mpn_and_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_and_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_andn_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_andn_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_nand_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_nand_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_ior_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_ior_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_iorn_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_iorn_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_nior_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_nior_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_xor_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_xor_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_xnor_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_BINARY_N_CALL (mpn_xnor_n (wp, xp, yp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL_N (mpn_mul_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQR (mpn_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_n_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQR_CALL (mpn_mul_n (wp, s->xp, s->xp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_basecase (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL(mpn_mul_basecase);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL(mpn_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sqr_basecase (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  /* FIXME: size restrictions on some versions of sqr_basecase */
Packit 5c3484
  SPEED_ROUTINE_MPN_SQR (mpn_sqr_basecase);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Speed wrappers for mpn_sqr_diagonal and mpn_sqr_diag_addlsh1, each
   compiled only when the matching HAVE_NATIVE_* symbol is set.  The
   SPEED_ROUTINE_* macros are defined outside this section and are expected
   to supply the timing loop and return value; wp and tp in the second
   wrapper are presumably locals provided by its macro.  */
#if HAVE_NATIVE_mpn_sqr_diagonal
double
speed_mpn_sqr_diagonal (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_SQR (mpn_sqr_diagonal);
}
#endif

#if HAVE_NATIVE_mpn_sqr_diag_addlsh1
double
speed_mpn_sqr_diag_addlsh1 (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_SQR_DIAG_ADDLSH1_CALL
    (mpn_sqr_diag_addlsh1 (wp, tp, s->xp, s->size));
}
#endif
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom2_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM2_SQR (mpn_toom2_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom3_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM3_SQR (mpn_toom3_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom4_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM4_SQR (mpn_toom4_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom6_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM6_SQR (mpn_toom6_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom8_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM8_SQR (mpn_toom8_sqr);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom22_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM22_MUL_N (mpn_toom22_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom33_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM33_MUL_N (mpn_toom33_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom44_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM44_MUL_N (mpn_toom44_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom6h_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM6H_MUL_N (mpn_toom6h_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom8h_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM8H_MUL_N (mpn_toom8h_mul);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom32_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM32_MUL (mpn_toom32_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom42_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM42_MUL (mpn_toom42_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom43_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM43_MUL (mpn_toom43_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom63_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM63_MUL (mpn_toom63_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom32_for_toom43_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM32_FOR_TOOM43_MUL (mpn_toom32_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom43_for_toom32_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM43_FOR_TOOM32_MUL (mpn_toom43_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom32_for_toom53_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM32_FOR_TOOM53_MUL (mpn_toom32_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom53_for_toom32_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM53_FOR_TOOM32_MUL (mpn_toom53_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom42_for_toom53_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM42_FOR_TOOM53_MUL (mpn_toom42_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom53_for_toom42_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM53_FOR_TOOM42_MUL (mpn_toom53_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom43_for_toom54_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM43_FOR_TOOM54_MUL (mpn_toom43_mul);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom54_for_toom43_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM54_FOR_TOOM43_MUL (mpn_toom54_mul);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_nussbaumer_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL_N_CALL
Packit 5c3484
    (mpn_nussbaumer_mul (wp, s->xp, s->size, s->yp, s->size));
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_nussbaumer_mul_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQR_CALL
Packit 5c3484
    (mpn_nussbaumer_mul (wp, s->xp, s->size, s->xp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Speed wrappers for mpn_mul_fft_full as a multiply and as a squaring,
   compiled only when WANT_OLD_FFT_FULL is set.  The call expression is
   handed to a SPEED_ROUTINE_*_CALL macro (defined outside this section),
   which is expected to supply the timing loop and return value; wp is
   presumably a local of those macros.  */
#if WANT_OLD_FFT_FULL
double
speed_mpn_mul_fft_full (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_MUL_N_CALL
    (mpn_mul_fft_full (wp, s->xp, s->size, s->yp, s->size));
}

double
speed_mpn_mul_fft_full_sqr (struct speed_params *s)
{
  SPEED_ROUTINE_MPN_SQR_CALL
    (mpn_mul_fft_full (wp, s->xp, s->size, s->xp, s->size));
}
#endif
Packit 5c3484
Packit 5c3484
/* These are mod 2^N+1 multiplies and squares.  If s->r is supplied it's
   used as k, otherwise the best k for the size is used.  If s->size isn't a
   multiple of 2^k it's rounded up to make the effective operation size.

   SPEED_ROUTINE_MPN_MUL_FFT_CALL expands to a complete function body for a
   function with a `struct speed_params *s' parameter.

     call  the expression to time.  It may use the locals declared here:
	   wp (destination, pl+1 limbs), pl (the size returned by
	   mpn_fft_next_size) and k.
     sqr   non-zero for a squaring.  It is passed to mpn_fft_best_k, and
	   when non-zero s->yp is not registered as a source operand.

   Sizes below 1 are rejected through SPEED_RESTRICT_COND.  Otherwise
   `call' is executed s->reps times between speed_starttime and
   speed_endtime, and the value of speed_endtime is returned.  */

#define SPEED_ROUTINE_MPN_MUL_FFT_CALL(call, sqr)       \
  {                                                     \
    mp_ptr     wp;                                      \
    mp_size_t  pl;                                      \
    int        k;                                       \
    unsigned   i;                                       \
    double     t;                                       \
    TMP_DECL;                                           \
                                                        \
    SPEED_RESTRICT_COND (s->size >= 1);                 \
                                                        \
    if (s->r != 0)                                      \
      k = s->r;                                         \
    else                                                \
      k = mpn_fft_best_k (s->size, sqr);                \
                                                        \
    TMP_MARK;                                           \
    pl = mpn_fft_next_size (s->size, k);                \
    SPEED_TMP_ALLOC_LIMBS (wp, pl+1, s->align_wp);      \
                                                        \
    speed_operand_src (s, s->xp, s->size);              \
    if (! (sqr))                                        \
      speed_operand_src (s, s->yp, s->size);            \
    speed_operand_dst (s, wp, pl+1);                    \
    speed_cache_fill (s);                               \
                                                        \
    speed_starttime ();                                 \
    i = s->reps;                                        \
    do                                                  \
      call;                                             \
    while (--i != 0);                                   \
    t = speed_endtime ();                               \
                                                        \
    TMP_FREE;                                           \
    return t;                                           \
  }
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_fft (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL_FFT_CALL
Packit 5c3484
    (mpn_mul_fft (wp, pl, s->xp, s->size, s->yp, s->size, k), 0);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mul_fft_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL_FFT_CALL
Packit 5c3484
    (mpn_mul_fft (wp, pl, s->xp, s->size, s->xp, s->size, k), 1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_fft_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MUL_N_CALL (mpn_fft_mul (wp, s->xp, s->size, s->yp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_fft_sqr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQR_CALL (mpn_fft_mul (wp, s->xp, s->size, s->xp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_sqrlo (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRLO (mpn_sqrlo);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_sqrlo_basecase (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRLO (mpn_sqrlo_basecase);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mullo_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULLO_N (mpn_mullo_n);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_mullo_basecase (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULLO_BASECASE (mpn_mullo_basecase);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mulmid_basecase (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMID (mpn_mulmid_basecase);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mulmid (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMID (mpn_mulmid);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mulmid_n (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMID_N (mpn_mulmid_n);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_toom42_mulmid (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_TOOM42_MULMID (mpn_toom42_mulmid);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mulmod_bnm1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMOD_BNM1_CALL (mpn_mulmod_bnm1 (wp, s->size, s->xp, s->size, s->yp, s->size, tp));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_bc_mulmod_bnm1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMOD_BNM1_CALL (mpn_bc_mulmod_bnm1 (wp, s->xp, s->yp, s->size, tp));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_mulmod_bnm1_rounded (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMOD_BNM1_ROUNDED (mpn_mulmod_bnm1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_sqrmod_bnm1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_MULMOD_BNM1_CALL (mpn_sqrmod_bnm1 (wp, s->size, s->xp, s->size, tp));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_matrix22_mul (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  /* Speed params only includes 2 inputs, so we have to invent the
Packit 5c3484
     other 6. */
Packit 5c3484
Packit 5c3484
  mp_ptr a;
Packit 5c3484
  mp_ptr r;
Packit 5c3484
  mp_ptr b;
Packit 5c3484
  mp_ptr tp;
Packit 5c3484
  mp_size_t itch;
Packit 5c3484
  unsigned i;
Packit 5c3484
  double t;
Packit 5c3484
  TMP_DECL;
Packit 5c3484
Packit 5c3484
  TMP_MARK;
Packit 5c3484
  SPEED_TMP_ALLOC_LIMBS (a, 4 * s->size, s->align_xp);
Packit 5c3484
  SPEED_TMP_ALLOC_LIMBS (b, 4 * s->size, s->align_yp);
Packit 5c3484
  SPEED_TMP_ALLOC_LIMBS (r, 8 * s->size + 4, s->align_wp);
Packit 5c3484
Packit 5c3484
  MPN_COPY (a, s->xp, s->size);
Packit 5c3484
  mpn_random (a + s->size, 3 * s->size);
Packit 5c3484
  MPN_COPY (b, s->yp, s->size);
Packit 5c3484
  mpn_random (b + s->size, 3 * s->size);
Packit 5c3484
Packit 5c3484
  itch = mpn_matrix22_mul_itch (s->size, s->size);
Packit 5c3484
  SPEED_TMP_ALLOC_LIMBS (tp, itch, s->align_wp2);
Packit 5c3484
Packit 5c3484
  speed_operand_src (s, a, 4 * s->size);
Packit 5c3484
  speed_operand_src (s, b, 4 * s->size);
Packit 5c3484
  speed_operand_dst (s, r, 8 * s->size + 4);
Packit 5c3484
  speed_operand_dst (s, tp, itch);
Packit 5c3484
  speed_cache_fill (s);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      mp_size_t sz = s->size;
Packit 5c3484
      MPN_COPY (r + 0 * sz + 0, a + 0 * sz, sz);
Packit 5c3484
      MPN_COPY (r + 2 * sz + 1, a + 1 * sz, sz);
Packit 5c3484
      MPN_COPY (r + 4 * sz + 2, a + 2 * sz, sz);
Packit 5c3484
      MPN_COPY (r + 6 * sz + 3, a + 3 * sz, sz);
Packit 5c3484
      mpn_matrix22_mul (r, r + 2 * sz + 1, r + 4 * sz + 2, r + 6 * sz + 3, sz,
Packit 5c3484
			b, b + 1 * sz,     b + 2 * sz,     b + 3 * sz,     sz,
Packit 5c3484
			tp);
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime();
Packit 5c3484
  TMP_FREE;
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_CALL (mpn_hgcd, mpn_hgcd_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_lehmer (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_CALL (mpn_hgcd_lehmer, mpn_hgcd_lehmer_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_appr (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_CALL (mpn_hgcd_appr, mpn_hgcd_appr_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_appr_lehmer (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_CALL (mpn_hgcd_appr_lehmer, mpn_hgcd_appr_lehmer_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_reduce (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_REDUCE_CALL (mpn_hgcd_reduce, mpn_hgcd_reduce_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_reduce_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_REDUCE_CALL (mpn_hgcd_reduce_1, mpn_hgcd_reduce_1_itch);
Packit 5c3484
}
Packit 5c3484
double
Packit 5c3484
speed_mpn_hgcd_reduce_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_HGCD_REDUCE_CALL (mpn_hgcd_reduce_2, mpn_hgcd_reduce_2_itch);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_gcd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCD (mpn_gcd);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpn_gcdext (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT (mpn_gcdext);
Packit 5c3484
}
Packit 5c3484
/* Disabled with "#if 0", so never compiled: a speed routine for
   __gmpn_gcdext_lehmer using the same SPEED_ROUTINE_MPN_GCDEXT macro as
   speed_mpn_gcdext.  */
#if 0
Packit 5c3484
double
Packit 5c3484
speed_mpn_gcdext_lehmer (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT (__gmpn_gcdext_lehmer);
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
/* Speed routine for mpn_gcdext_single, measured with the same
   SPEED_ROUTINE_MPN_GCDEXT macro as speed_mpn_gcdext.  */
double
Packit 5c3484
speed_mpn_gcdext_single (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT (mpn_gcdext_single);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_gcdext_double, measured with the same
   SPEED_ROUTINE_MPN_GCDEXT macro as speed_mpn_gcdext.  */
double
Packit 5c3484
speed_mpn_gcdext_double (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT (mpn_gcdext_double);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_gcdext_one_single.  The body is the
   SPEED_ROUTINE_MPN_GCDEXT_ONE macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_gcdext_one_single (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT_ONE (mpn_gcdext_one_single);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_gcdext_one_double.  The body is the
   SPEED_ROUTINE_MPN_GCDEXT_ONE macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_gcdext_one_double (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCDEXT_ONE (mpn_gcdext_one_double);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_gcd_1.  The body is the SPEED_ROUTINE_MPN_GCD_1
   macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_gcd_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCD_1 (mpn_gcd_1);
Packit 5c3484
}
Packit 5c3484
/* Like speed_mpn_gcd_1 this measures mpn_gcd_1, but through the
   SPEED_ROUTINE_MPN_GCD_1N macro.  How the two macros differ is not
   visible in this part of the file.  */
double
Packit 5c3484
speed_mpn_gcd_1N (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GCD_1N (mpn_gcd_1);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for mpz_jacobi.  The body is the SPEED_ROUTINE_MPZ_JACOBI
   macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_jacobi (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_JACOBI (mpz_jacobi);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_jacobi_base.  The body is the
   SPEED_ROUTINE_MPN_JACBASE macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_jacobi_base (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_JACBASE (mpn_jacobi_base);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_jacobi_base_1, measured with the same
   SPEED_ROUTINE_MPN_JACBASE macro as speed_mpn_jacobi_base.  */
double
Packit 5c3484
speed_mpn_jacobi_base_1 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_JACBASE (mpn_jacobi_base_1);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_jacobi_base_2, measured with the same
   SPEED_ROUTINE_MPN_JACBASE macro as speed_mpn_jacobi_base.  */
double
Packit 5c3484
speed_mpn_jacobi_base_2 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_JACBASE (mpn_jacobi_base_2);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_jacobi_base_3, measured with the same
   SPEED_ROUTINE_MPN_JACBASE macro as speed_mpn_jacobi_base.  */
double
Packit 5c3484
speed_mpn_jacobi_base_3 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_JACBASE (mpn_jacobi_base_3);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpn_jacobi_base_4, measured with the same
   SPEED_ROUTINE_MPN_JACBASE macro as speed_mpn_jacobi_base.  */
double
Packit 5c3484
speed_mpn_jacobi_base_4 (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_JACBASE (mpn_jacobi_base_4);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for mpn_sqrtrem on the s->size limbs at s->xp, with both
   a root destination (wp) and a remainder destination (wp2).  Neither wp
   nor wp2 is declared here, so they presumably come from the
   SPEED_ROUTINE_MPN_SQRTROOT_CALL macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_sqrtrem (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRTROOT_CALL (mpn_sqrtrem (wp, wp2, s->xp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Same measurement as speed_mpn_sqrtrem, except that NULL is passed as
   the remainder destination of mpn_sqrtrem.  wp presumably comes from the
   SPEED_ROUTINE_MPN_SQRTROOT_CALL macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_sqrt (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRTROOT_CALL (mpn_sqrtrem (wp, NULL, s->xp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Speed routine for mpn_rootrem on the s->size limbs at s->xp, with s->r
   as its last argument and both wp and wp2 as destinations.  wp and wp2
   presumably come from the SPEED_ROUTINE_MPN_SQRTROOT_CALL macro (defined
   elsewhere).  */
double
Packit 5c3484
speed_mpn_rootrem (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRTROOT_CALL (mpn_rootrem (wp, wp2, s->xp, s->size, s->r));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Same measurement as speed_mpn_rootrem, except that NULL is passed as
   the remainder destination of mpn_rootrem.  */
double
Packit 5c3484
speed_mpn_root (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SQRTROOT_CALL (mpn_rootrem (wp, NULL, s->xp, s->size, s->r));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for mpz_fac_ui.  The body is the SPEED_ROUTINE_MPZ_FAC_UI
   macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_fac_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_FAC_UI (mpz_fac_ui);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Speed routine for mpz_2fac_ui.  Note that it goes through the
   SPEED_ROUTINE_MPZ_UI macro (defined elsewhere), not the FAC_UI macro
   used by speed_mpz_fac_ui.  */
double
Packit 5c3484
speed_mpz_2fac_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_UI (mpz_2fac_ui);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for mpn_fib2_ui.  The body is the
   SPEED_ROUTINE_MPN_FIB2_UI macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpn_fib2_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_FIB2_UI (mpn_fib2_ui);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_fib_ui.  The body is the SPEED_ROUTINE_MPZ_FIB_UI
   macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_fib_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_FIB_UI (mpz_fib_ui);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_fib2_ui.  The body is the
   SPEED_ROUTINE_MPZ_FIB2_UI macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_fib2_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_FIB2_UI (mpz_fib2_ui);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_lucnum_ui.  The body is the
   SPEED_ROUTINE_MPZ_LUCNUM_UI macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_lucnum_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_LUCNUM_UI (mpz_lucnum_ui);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_lucnum2_ui.  The body is the
   SPEED_ROUTINE_MPZ_LUCNUM2_UI macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_lucnum2_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_LUCNUM2_UI (mpz_lucnum2_ui);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for mpz_powm.  The body is the SPEED_ROUTINE_MPZ_POWM
   macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_powm (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_POWM (mpz_powm);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_powm_mod, measured with the same
   SPEED_ROUTINE_MPZ_POWM macro as speed_mpz_powm.  */
double
Packit 5c3484
speed_mpz_powm_mod (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_POWM (mpz_powm_mod);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_powm_redc, measured with the same
   SPEED_ROUTINE_MPZ_POWM macro as speed_mpz_powm.  */
double
Packit 5c3484
speed_mpz_powm_redc (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_POWM (mpz_powm_redc);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_powm_sec, measured with the same
   SPEED_ROUTINE_MPZ_POWM macro as speed_mpz_powm.  */
double
Packit 5c3484
speed_mpz_powm_sec (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_POWM (mpz_powm_sec);
Packit 5c3484
}
Packit 5c3484
/* Speed routine for mpz_powm_ui.  The body is the
   SPEED_ROUTINE_MPZ_POWM_UI macro (defined elsewhere).  */
double
Packit 5c3484
speed_mpz_powm_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPZ_POWM_UI (mpz_powm_ui);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for binvert_limb.  The body is the
   SPEED_ROUTINE_MODLIMB_INVERT macro (defined elsewhere).  */
double
Packit 5c3484
speed_binvert_limb (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MODLIMB_INVERT (binvert_limb);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Time s->reps calls to noop (), and return what speed_endtime ()
   reports.  Presumably this serves as a baseline for the cost of the loop
   plus a call with no arguments.

   The do/while tests after the body, so s->reps is expected to be at
   least 1; with 0 the unsigned counter would wrap round instead of
   stopping.  */
double
Packit 5c3484
speed_noop (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  unsigned  i;
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    noop ();
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  return speed_endtime ();
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time s->reps calls to noop_wxs (wp, s->xp, s->size), i.e. a call taking
   a destination pointer, a source pointer and a size.

   wp is only a 1 limb temporary even though s->size is passed as the size;
   presumably noop_wxs does not touch the memory (confirm against its
   definition).  The TMP area is released only after the timing ends.  */
double
Packit 5c3484
speed_noop_wxs (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  mp_ptr   wp;
Packit 5c3484
  unsigned i;
Packit 5c3484
  double   t;
Packit 5c3484
  TMP_DECL;
Packit 5c3484
Packit 5c3484
  TMP_MARK;
Packit 5c3484
  wp = TMP_ALLOC_LIMBS (1);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    noop_wxs (wp, s->xp, s->size);
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  TMP_FREE;
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time s->reps calls to noop_wxys (wp, s->xp, s->yp, s->size), i.e. a call
   taking a destination pointer, two source pointers and a size.

   wp is only a 1 limb temporary even though s->size is passed as the size;
   presumably noop_wxys does not touch the memory (confirm against its
   definition).  The TMP area is released only after the timing ends.  */
double
Packit 5c3484
speed_noop_wxys (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  mp_ptr   wp;
Packit 5c3484
  unsigned i;
Packit 5c3484
  double   t;
Packit 5c3484
  TMP_DECL;
Packit 5c3484
Packit 5c3484
  TMP_MARK;
Packit 5c3484
  wp = TMP_ALLOC_LIMBS (1);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    noop_wxys (wp, s->xp, s->yp, s->size);
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  TMP_FREE;
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Body template for the allocate/free speed routines.  "variables" is a
   declaration placed at the top of the block, "calls" is the statement
   sequence to be timed.  It expands to a block that starts the timer,
   executes "calls" s->reps times and returns speed_endtime (), so "s" must
   be in scope and the macro must be the last thing in the function.
   "calls" is written without a trailing semicolon; the macro adds it.  */
#define SPEED_ROUTINE_ALLOC_FREE(variables, calls)      \
Packit 5c3484
  {                                                     \
Packit 5c3484
    unsigned  i;                                        \
Packit 5c3484
    variables;                                          \
Packit 5c3484
							\
Packit 5c3484
    speed_starttime ();                                 \
Packit 5c3484
    i = s->reps;                                        \
Packit 5c3484
    do                                                  \
Packit 5c3484
      {                                                 \
Packit 5c3484
	calls;                                          \
Packit 5c3484
      }                                                 \
Packit 5c3484
    while (--i != 0);                                   \
Packit 5c3484
    return speed_endtime ();                            \
Packit 5c3484
  }
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Compare these to see how much malloc/free costs and then how much
Packit 5c3484
   __gmp_default_allocate/free and mpz_init/clear add.  mpz_init/clear or
Packit 5c3484
   mpq_init/clear will be doing a 1 limb allocate, so use that as the size
Packit 5c3484
   when including them in comparisons.  */
Packit 5c3484
Packit 5c3484
/* Time a malloc immediately followed by free, for a block of s->size
   limbs (s->size * GMP_LIMB_BYTES bytes).  The malloc result is passed to
   free without being checked.  */
double
Packit 5c3484
speed_malloc_free (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  size_t  bytes = s->size * GMP_LIMB_BYTES;
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (void *p,
Packit 5c3484
			    p = malloc (bytes);
Packit 5c3484
			    free (p));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time malloc of one limb, realloc of that block to s->size limbs, then
   free.  Return values are not checked; this is purely a timing loop.  */
double
Packit 5c3484
speed_malloc_realloc_free (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  size_t  bytes = s->size * GMP_LIMB_BYTES;
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (void *p,
Packit 5c3484
			    p = malloc (GMP_LIMB_BYTES);
Packit 5c3484
			    p = realloc (p, bytes);
Packit 5c3484
			    free (p));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Same measurement as speed_malloc_free, but going through the
   __gmp_allocate_func and __gmp_free_func pointers; the free function is
   passed the same byte count that was allocated.  */
double
Packit 5c3484
speed_gmp_allocate_free (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  size_t  bytes = s->size * GMP_LIMB_BYTES;
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (void *p,
Packit 5c3484
			    p = (*__gmp_allocate_func) (bytes);
Packit 5c3484
			    (*__gmp_free_func) (p, bytes));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_gmp_allocate_reallocate_free (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  size_t  bytes = s->size * GMP_LIMB_BYTES;
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE
Packit 5c3484
    (void *p,
Packit 5c3484
     p = (*__gmp_allocate_func) (GMP_LIMB_BYTES);
Packit 5c3484
     p = (*__gmp_reallocate_func) (p, bytes, GMP_LIMB_BYTES);
Packit 5c3484
     (*__gmp_free_func) (p, bytes));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time an mpz_init immediately followed by mpz_clear on the same
   variable.  s->size is not used.  */
double
Packit 5c3484
speed_mpz_init_clear (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (mpz_t z,
Packit 5c3484
			    mpz_init (z);
Packit 5c3484
			    mpz_clear (z));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time mpz_init, then _mpz_realloc of the variable to s->size limbs, then
   mpz_clear.  */
double
Packit 5c3484
speed_mpz_init_realloc_clear (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (mpz_t z,
Packit 5c3484
			    mpz_init (z);
Packit 5c3484
			    _mpz_realloc (z, s->size);
Packit 5c3484
			    mpz_clear (z));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time an mpq_init immediately followed by mpq_clear on the same
   variable.  s->size is not used.  */
double
Packit 5c3484
speed_mpq_init_clear (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (mpq_t q,
Packit 5c3484
			    mpq_init (q);
Packit 5c3484
			    mpq_clear (q));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time an mpf_init immediately followed by mpf_clear on the same
   variable.  s->size is not used.  */
double
Packit 5c3484
speed_mpf_init_clear (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_ALLOC_FREE (mpf_t f,
Packit 5c3484
			    mpf_init (f);
Packit 5c3484
			    mpf_clear (f));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Compare this to mpn_add_n to see how much overhead mpz_add adds.  Note
Packit 5c3484
   that repeatedly calling mpz_add with the same data gives branch prediction
Packit 5c3484
   in it an advantage.  */
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpz_add (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  mpz_t     w, x, y;
Packit 5c3484
  unsigned  i;
Packit 5c3484
  double    t;
Packit 5c3484
Packit 5c3484
  mpz_init (w);
Packit 5c3484
  mpz_init (x);
Packit 5c3484
  mpz_init (y);
Packit 5c3484
Packit 5c3484
  mpz_set_n (x, s->xp, s->size);
Packit 5c3484
  mpz_set_n (y, s->yp, s->size);
Packit 5c3484
  mpz_add (w, x, y);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      mpz_add (w, x, y);
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  mpz_clear (w);
Packit 5c3484
  mpz_clear (x);
Packit 5c3484
  mpz_clear (y);
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* If r==0, calculate binomial(size,size/2),
Packit 5c3484
   otherwise calculate binomial(size,r). */
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpz_bin_uiui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  mpz_t          w;
Packit 5c3484
  unsigned long  k;
Packit 5c3484
  unsigned  i;
Packit 5c3484
  double    t;
Packit 5c3484
Packit 5c3484
  mpz_init (w);
Packit 5c3484
  if (s->r != 0)
Packit 5c3484
    k = s->r;
Packit 5c3484
  else
Packit 5c3484
    k = s->size/2;
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      mpz_bin_uiui (w, s->size, k);
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  mpz_clear (w);
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* If r==0, calculate binomial(2^size,size),
Packit 5c3484
   otherwise calculate binomial(2^size,r). */
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpz_bin_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  mpz_t          w, x;
Packit 5c3484
  unsigned long  k;
Packit 5c3484
  unsigned  i;
Packit 5c3484
  double    t;
Packit 5c3484
Packit 5c3484
  mpz_init (w);
Packit 5c3484
  mpz_init_set_ui (x, 0);
Packit 5c3484
Packit 5c3484
  mpz_setbit (x, s->size);
Packit 5c3484
Packit 5c3484
  if (s->r != 0)
Packit 5c3484
    k = s->r;
Packit 5c3484
  else
Packit 5c3484
    k = s->size;
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      mpz_bin_ui (w, x, k);
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  mpz_clear (w);
Packit 5c3484
  mpz_clear (x);
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* The multiplies are successively dependent so the latency is measured, not
Packit 5c3484
   the issue rate.  There's only 10 per loop so the code doesn't get too big
Packit 5c3484
   since umul_ppmm is several instructions on some cpus.
Packit 5c3484
Packit 5c3484
   Putting the arguments as "h,l,l,h" gets slightly better code from gcc
Packit 5c3484
   2.95.2 on x86, it puts only one mov between each mul, not two.  That mov
Packit 5c3484
   will probably show up as a bogus extra cycle though.
Packit 5c3484
Packit 5c3484
   The measuring function macros are split into three parts to avoid overflowing
Packit 5c3484
   preprocessor expansion space if umul_ppmm is big.
Packit 5c3484
Packit 5c3484
   Limitations:
Packit 5c3484
Packit 5c3484
   Don't blindly use this to set UMUL_TIME in gmp-mparam.h, check the code
Packit 5c3484
   generated first, especially on CPUs with low latency multipliers.
Packit 5c3484
Packit 5c3484
   The default umul_ppmm doing h*l will be getting increasing numbers of
Packit 5c3484
   high zero bits in the calculation.  CPUs with data-dependent multipliers
Packit 5c3484
   will want to use umul_ppmm.1 to get some randomization into the
Packit 5c3484
   calculation.  The extra xors and fetches will be a slowdown of course.  */
Packit 5c3484
Packit 5c3484
/* The three macros below only form valid code when used together, in the
   order A, <block 1>, B, <block 2>, C, as the body of a function having
   "struct speed_params *s" in scope.

   _A declares h, l, i and t, sets s->time_divisor to 10 (the users below
   put ten operations in each block), loads h and l from s->xp[0] and
   s->yp[0], and opens the timed loop that is used when s->r == 1.
   _B closes that loop and opens the timed loop for every other s->r.
   _C closes that one, passes h and l to noop_1 so the results are used,
   and returns the measured time.  */
#define SPEED_MACRO_UMUL_PPMM_A \
Packit 5c3484
  {                             \
Packit 5c3484
    mp_limb_t  h, l;            \
Packit 5c3484
    unsigned   i;               \
Packit 5c3484
    double     t;               \
Packit 5c3484
				\
Packit 5c3484
    s->time_divisor = 10;       \
Packit 5c3484
				\
Packit 5c3484
    h = s->xp[0];               \
Packit 5c3484
    l = s->yp[0];               \
Packit 5c3484
				\
Packit 5c3484
    if (s->r == 1)              \
Packit 5c3484
      {                         \
Packit 5c3484
	speed_starttime ();     \
Packit 5c3484
	i = s->reps;            \
Packit 5c3484
	do                      \
Packit 5c3484
	  {
Packit 5c3484
Packit 5c3484
#define SPEED_MACRO_UMUL_PPMM_B \
Packit 5c3484
	  }                     \
Packit 5c3484
	while (--i != 0);       \
Packit 5c3484
	t = speed_endtime ();   \
Packit 5c3484
      }                         \
Packit 5c3484
    else                        \
Packit 5c3484
      {                         \
Packit 5c3484
	speed_starttime ();     \
Packit 5c3484
	i = s->reps;            \
Packit 5c3484
	do                      \
Packit 5c3484
	  {
Packit 5c3484
Packit 5c3484
#define SPEED_MACRO_UMUL_PPMM_C                                         \
Packit 5c3484
	  }                                                             \
Packit 5c3484
	while (--i != 0);                                               \
Packit 5c3484
	t = speed_endtime ();                                           \
Packit 5c3484
      }                                                                 \
Packit 5c3484
									\
Packit 5c3484
    /* stop the compiler optimizing away the whole calculation! */      \
Packit 5c3484
    noop_1 (h);                                                         \
Packit 5c3484
    noop_1 (l);                                                         \
Packit 5c3484
									\
Packit 5c3484
    return t;                                                           \
Packit 5c3484
  }
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Time the umul_ppmm macro, ten dependent multiplies per loop iteration
   (matching the time_divisor of 10 set in SPEED_MACRO_UMUL_PPMM_A).

   The first block is the one run when s->r == 1: each product is xored
   with entries 0 to 9 of s->xp_block and s->yp_block.  The second block,
   run for any other s->r, feeds each product straight into the next
   multiply.  */
double
Packit 5c3484
speed_umul_ppmm (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_A;
Packit 5c3484
  {
Packit 5c3484
    umul_ppmm (h, l, l, h);  h ^= s->xp_block[0]; l ^= s->yp_block[0];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[1]; l ^= s->yp_block[1];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[2]; l ^= s->yp_block[2];
Packit 5c3484
    umul_ppmm (h, l, l, h);  h ^= s->xp_block[3]; l ^= s->yp_block[3];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[4]; l ^= s->yp_block[4];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[5]; l ^= s->yp_block[5];
Packit 5c3484
    umul_ppmm (h, l, l, h);  h ^= s->xp_block[6]; l ^= s->yp_block[6];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[7]; l ^= s->yp_block[7];
Packit 5c3484
     umul_ppmm (h, l, l, h); h ^= s->xp_block[8]; l ^= s->yp_block[8];
Packit 5c3484
    umul_ppmm (h, l, l, h);  h ^= s->xp_block[9]; l ^= s->yp_block[9];
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_B;
Packit 5c3484
  {
Packit 5c3484
    umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
    umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
    umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
     umul_ppmm (h, l, l, h);
Packit 5c3484
    umul_ppmm (h, l, l, h);
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_C;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Only built when HAVE_NATIVE_mpn_umul_ppmm is set.  Same layout as
   speed_umul_ppmm, but timing the function mpn_umul_ppmm, which returns
   the high limb and stores the low limb through its first argument.  The
   first block (s->r == 1) xors in s->xp_block / s->yp_block entries, the
   second block chains the results directly.  */
#if HAVE_NATIVE_mpn_umul_ppmm
Packit 5c3484
double
Packit 5c3484
speed_mpn_umul_ppmm (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_A;
Packit 5c3484
  {
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);  h ^= s->xp_block[0]; l ^= s->yp_block[0];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[1]; l ^= s->yp_block[1];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[2]; l ^= s->yp_block[2];
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);  h ^= s->xp_block[3]; l ^= s->yp_block[3];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[4]; l ^= s->yp_block[4];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[5]; l ^= s->yp_block[5];
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);  h ^= s->xp_block[6]; l ^= s->yp_block[6];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[7]; l ^= s->yp_block[7];
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l); h ^= s->xp_block[8]; l ^= s->yp_block[8];
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);  h ^= s->xp_block[9]; l ^= s->yp_block[9];
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_B;
Packit 5c3484
  {
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
     h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
    h = mpn_umul_ppmm (&l, h, l);
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_C;
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
/* Only built when HAVE_NATIVE_mpn_umul_ppmm_r is set.  Same layout as
   speed_umul_ppmm, but timing mpn_umul_ppmm_r, which takes the pointer for
   the low limb as its last argument rather than its first.  The first
   block (s->r == 1) xors in s->xp_block / s->yp_block entries, the second
   block chains the results directly.  */
#if HAVE_NATIVE_mpn_umul_ppmm_r
Packit 5c3484
double
Packit 5c3484
speed_mpn_umul_ppmm_r (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_A;
Packit 5c3484
  {
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);  h ^= s->xp_block[0]; l ^= s->yp_block[0];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[1]; l ^= s->yp_block[1];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[2]; l ^= s->yp_block[2];
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);  h ^= s->xp_block[3]; l ^= s->yp_block[3];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[4]; l ^= s->yp_block[4];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[5]; l ^= s->yp_block[5];
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);  h ^= s->xp_block[6]; l ^= s->yp_block[6];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[7]; l ^= s->yp_block[7];
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l); h ^= s->xp_block[8]; l ^= s->yp_block[8];
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);  h ^= s->xp_block[9]; l ^= s->yp_block[9];
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_B;
Packit 5c3484
  {
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
     h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
    h = mpn_umul_ppmm_r (h, l, &l);
Packit 5c3484
  }
Packit 5c3484
  SPEED_MACRO_UMUL_PPMM_C;
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* The divisions are successively dependent so latency is measured, not
Packit 5c3484
   issue rate.  There's only 10 per loop so the code doesn't get too big,
Packit 5c3484
   especially for udiv_qrnnd_preinv and preinv2norm, which are several
Packit 5c3484
   instructions each.
Packit 5c3484
Packit 5c3484
   Note that it's only the division which is measured here, there's no data
Packit 5c3484
   fetching and no shifting if the divisor gets normalized.
Packit 5c3484
Packit 5c3484
   In speed_udiv_qrnnd with gcc 2.95.2 on x86 the parameters "q,r,r,q,d"
Packit 5c3484
   generate x86 div instructions with nothing in between.
Packit 5c3484
Packit 5c3484
   The measuring function macros are in two parts to avoid overflowing
Packit 5c3484
   preprocessor expansion space if udiv_qrnnd etc are big.
Packit 5c3484
Packit 5c3484
   Limitations:
Packit 5c3484
Packit 5c3484
   Don't blindly use this to set UDIV_TIME in gmp-mparam.h, check the code
Packit 5c3484
   generated first.
Packit 5c3484
Packit 5c3484
   CPUs with data-dependent divisions may want more attention paid to the
Packit 5c3484
   randomness of the data used.  Probably the measurement wanted is over
Packit 5c3484
   uniformly distributed numbers, but what's here might not be giving that.  */
Packit 5c3484
Packit 5c3484
/* The two macros below are used as a pair, A, <block>, B, as the body of a
   function having "struct speed_params *s" in scope.

   _A declares t, i, q, r, d and dinv and sets s->time_divisor to 10 (the
   users below put ten divisions in the block).  The divisor d is s->r, or
   mp_bases[10].big_base when s->r is zero.  If "normalize" is non-zero, d
   is shifted left by its count of leading zeros and dinv is set with
   invert_limb; otherwise dinv is left unset.  q starts as s->xp[0] and r
   as s->yp[0] % d, so r is less than d on entry to the loop.  _A then
   starts the timer and opens the do-loop.

   _B closes the loop, stops the timer, passes q and r to noop_1 so the
   results are used, and returns the measured time.  */
#define SPEED_ROUTINE_UDIV_QRNND_A(normalize)           \
Packit 5c3484
  {                                                     \
Packit 5c3484
    double     t;                                       \
Packit 5c3484
    unsigned   i;                                       \
Packit 5c3484
    mp_limb_t  q, r, d;                                 \
Packit 5c3484
    mp_limb_t  dinv;                                    \
Packit 5c3484
							\
Packit 5c3484
    s->time_divisor = 10;                               \
Packit 5c3484
							\
Packit 5c3484
    /* divisor from "r" parameter, or a default */      \
Packit 5c3484
    d = s->r;                                           \
Packit 5c3484
    if (d == 0)                                         \
Packit 5c3484
      d = mp_bases[10].big_base;                        \
Packit 5c3484
							\
Packit 5c3484
    if (normalize)                                      \
Packit 5c3484
      {                                                 \
Packit 5c3484
	unsigned  norm;                                 \
Packit 5c3484
	count_leading_zeros (norm, d);                  \
Packit 5c3484
	d <<= norm;                                     \
Packit 5c3484
	invert_limb (dinv, d);                          \
Packit 5c3484
      }                                                 \
Packit 5c3484
							\
Packit 5c3484
    q = s->xp[0];                                       \
Packit 5c3484
    r = s->yp[0] % d;                                   \
Packit 5c3484
							\
Packit 5c3484
    speed_starttime ();                                 \
Packit 5c3484
    i = s->reps;                                        \
Packit 5c3484
    do                                                  \
Packit 5c3484
      {
Packit 5c3484
Packit 5c3484
#define SPEED_ROUTINE_UDIV_QRNND_B                                      \
Packit 5c3484
      }                                                                 \
Packit 5c3484
    while (--i != 0);                                                   \
Packit 5c3484
    t = speed_endtime ();                                               \
Packit 5c3484
									\
Packit 5c3484
    /* stop the compiler optimizing away the whole calculation! */      \
Packit 5c3484
    noop_1 (q);                                                         \
Packit 5c3484
    noop_1 (r);                                                         \
Packit 5c3484
									\
Packit 5c3484
    return t;                                                           \
Packit 5c3484
  }
Packit 5c3484
Packit 5c3484
/* Time the udiv_qrnnd macro, ten dependent divisions per loop iteration.
   The divisor is normalized only when UDIV_NEEDS_NORMALIZATION is
   non-zero.  Each division takes the previous remainder and quotient as
   its high and low dividend limbs.  */
double
Packit 5c3484
speed_udiv_qrnnd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_A (UDIV_NEEDS_NORMALIZATION);
Packit 5c3484
  {
Packit 5c3484
    udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
    udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
    udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
     udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
    udiv_qrnnd (q, r, r, q, d);
Packit 5c3484
  }
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_B;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time __udiv_qrnnd_c, ten dependent divisions per loop iteration.  The
   divisor is always normalized here (the macro argument is 1).  */
double
Packit 5c3484
speed_udiv_qrnnd_c (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_A (1);
Packit 5c3484
  {
Packit 5c3484
    __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
    __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
    __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
     __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
    __udiv_qrnnd_c (q, r, r, q, d);
Packit 5c3484
  }
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_B;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Only built when HAVE_NATIVE_mpn_udiv_qrnnd is set.  Times the function
   mpn_udiv_qrnnd, which returns the quotient and stores the remainder
   through its first argument; ten dependent calls per loop iteration, with
   the divisor always normalized.  */
#if HAVE_NATIVE_mpn_udiv_qrnnd
Packit 5c3484
double
Packit 5c3484
speed_mpn_udiv_qrnnd (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_A (1);
Packit 5c3484
  {
Packit 5c3484
    q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
    q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
    q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
     q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
    q = mpn_udiv_qrnnd (&r, r, q, d);
Packit 5c3484
  }
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_B;
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
/* Only built when HAVE_NATIVE_mpn_udiv_qrnnd_r is set.  Times
   mpn_udiv_qrnnd_r, which takes the remainder pointer as its last argument
   rather than its first; ten dependent calls per loop iteration, with the
   divisor always normalized.  */
#if HAVE_NATIVE_mpn_udiv_qrnnd_r
Packit 5c3484
double
Packit 5c3484
speed_mpn_udiv_qrnnd_r (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_A (1);
Packit 5c3484
  {
Packit 5c3484
    q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
    q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
    q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
     q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
    q = mpn_udiv_qrnnd_r (r, q, d, &r);
Packit 5c3484
  }
Packit 5c3484
  SPEED_ROUTINE_UDIV_QRNND_B;
Packit 5c3484
}
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Speed routine for invert_limb.  dinv and d are not declared here, so
   they presumably come from the SPEED_ROUTINE_INVERT_LIMB_CALL macro
   (defined elsewhere), which is handed the call to be timed.  */
double
Packit 5c3484
speed_invert_limb (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_INVERT_LIMB_CALL (invert_limb (dinv, d));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* xp[0] might not be particularly random, but should give an indication how
Packit 5c3484
   "/" runs.  Same for speed_operator_mod below.  */
Packit 5c3484
/* Time the C "/" operator on mp_limb_t.  Each loop iteration does ten
   "xor with x, then divide by d" steps, matching the time_divisor of 10.
   Every step uses the previous quotient, so the divisions are dependent
   on one another; the xor with x also keeps q from simply staying at
   zero.  The divisor is s->r, or mp_bases[10].big_base when s->r is
   zero.  */
double
Packit 5c3484
speed_operator_div (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  double     t;
Packit 5c3484
  unsigned   i;
Packit 5c3484
  mp_limb_t  x, q, d;
Packit 5c3484
Packit 5c3484
  s->time_divisor = 10;
Packit 5c3484
Packit 5c3484
  /* divisor from "r" parameter, or a default */
Packit 5c3484
  d = s->r;
Packit 5c3484
  if (d == 0)
Packit 5c3484
    d = mp_bases[10].big_base;
Packit 5c3484
Packit 5c3484
  x = s->xp[0];
Packit 5c3484
  q = 0;
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
      q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
      q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
       q ^= x; q /= d;
Packit 5c3484
      q ^= x; q /= d;
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  /* stop the compiler optimizing away the whole calculation! */
Packit 5c3484
  noop_1 (q);
Packit 5c3484
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Time the C "%" operator on mp_limb_t.  Each loop iteration does ten
   "xor with x, then reduce mod d" steps, matching the time_divisor of 10.
   Every step uses the previous remainder, so the operations are dependent
   on one another.  The divisor is s->r, or mp_bases[10].big_base when s->r
   is zero; x is s->xp[0].  */
double
Packit 5c3484
speed_operator_mod (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  double     t;
Packit 5c3484
  unsigned   i;
Packit 5c3484
  mp_limb_t  x, r, d;
Packit 5c3484
Packit 5c3484
  s->time_divisor = 10;
Packit 5c3484
Packit 5c3484
  /* divisor from "r" parameter, or a default */
Packit 5c3484
  d = s->r;
Packit 5c3484
  if (d == 0)
Packit 5c3484
    d = mp_bases[10].big_base;
Packit 5c3484
Packit 5c3484
  x = s->xp[0];
Packit 5c3484
  r = 0;
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
      r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
      r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
       r ^= x; r %= d;
Packit 5c3484
      r ^= x; r %= d;
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  /* stop the compiler optimizing away the whole calculation! */
Packit 5c3484
  noop_1 (r);
Packit 5c3484
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* r==0 measures on data with the values uniformly distributed.  This will
Packit 5c3484
   be typical for count_trailing_zeros in a GCD etc.
Packit 5c3484
Packit 5c3484
   r==1 measures on data with the resultant count uniformly distributed
Packit 5c3484
   between 0 and GMP_LIMB_BITS-1.  This is probably sensible for
Packit 5c3484
   count_leading_zeros on the high limbs of divisors.  */
Packit 5c3484
Packit 5c3484
int
Packit 5c3484
speed_routine_count_zeros_setup (struct speed_params *s,
Packit 5c3484
				 mp_ptr xp, int leading, int zero)
Packit 5c3484
{
Packit 5c3484
  int        i, c;
Packit 5c3484
  mp_limb_t  n;
Packit 5c3484
Packit 5c3484
  if (s->r == 0)
Packit 5c3484
    {
Packit 5c3484
      /* Make uniformly distributed data.  If zero isn't allowed then change
Packit 5c3484
	 it to 1 for leading, or 0x800..00 for trailing.  */
Packit 5c3484
      MPN_COPY (xp, s->xp_block, SPEED_BLOCK_SIZE);
Packit 5c3484
      if (! zero)
Packit 5c3484
	for (i = 0; i < SPEED_BLOCK_SIZE; i++)
Packit 5c3484
	  if (xp[i] == 0)
Packit 5c3484
	    xp[i] = leading ? 1 : GMP_LIMB_HIGHBIT;
Packit 5c3484
    }
Packit 5c3484
  else if (s->r == 1)
Packit 5c3484
    {
Packit 5c3484
      /* Make counts uniformly distributed.  A randomly chosen bit is set, and
Packit 5c3484
	 for leading the rest above it are cleared, or for trailing then the
Packit 5c3484
	 rest below.  */
Packit 5c3484
      for (i = 0; i < SPEED_BLOCK_SIZE; i++)
Packit 5c3484
	{
Packit 5c3484
	  mp_limb_t  set = CNST_LIMB(1) << (s->yp_block[i] % GMP_LIMB_BITS);
Packit 5c3484
	  mp_limb_t  keep_below = set-1;
Packit 5c3484
	  mp_limb_t  keep_above = MP_LIMB_T_MAX ^ keep_below;
Packit 5c3484
	  mp_limb_t  keep = (leading ? keep_below : keep_above);
Packit 5c3484
	  xp[i] = (s->xp_block[i] & keep) | set;
Packit 5c3484
	}
Packit 5c3484
    }
Packit 5c3484
  else
Packit 5c3484
    {
Packit 5c3484
      return 0;
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  /* Account for the effect of n^=c. */
Packit 5c3484
  c = 0;
Packit 5c3484
  for (i = 0; i < SPEED_BLOCK_SIZE; i++)
Packit 5c3484
    {
Packit 5c3484
      n = xp[i];
Packit 5c3484
      xp[i] ^= c;
Packit 5c3484
Packit 5c3484
      if (leading)
Packit 5c3484
	count_leading_zeros (c, n);
Packit 5c3484
      else
Packit 5c3484
	count_trailing_zeros (c, n);
Packit 5c3484
    }
Packit 5c3484
Packit 5c3484
  return 1;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Speed routine for count_leading_zeros.  The SPEED_ROUTINE_COUNT_ZEROS_A
   and _B macros (defined elsewhere) bracket the operation being timed; c
   and n are not declared here, so they presumably come from _A.

   The arguments to _A presumably correspond to the "leading" and "zero"
   parameters of speed_routine_count_zeros_setup (confirm against the
   macro): leading is 1, and a zero operand is allowed exactly when
   COUNT_LEADING_ZEROS_0 is defined.  */
double
Packit 5c3484
speed_count_leading_zeros (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
#ifdef COUNT_LEADING_ZEROS_0
Packit 5c3484
#define COUNT_LEADING_ZEROS_0_ALLOWED   1
Packit 5c3484
#else
Packit 5c3484
#define COUNT_LEADING_ZEROS_0_ALLOWED   0
Packit 5c3484
#endif
Packit 5c3484
Packit 5c3484
  SPEED_ROUTINE_COUNT_ZEROS_A (1, COUNT_LEADING_ZEROS_0_ALLOWED);
Packit 5c3484
  count_leading_zeros (c, n);
Packit 5c3484
  SPEED_ROUTINE_COUNT_ZEROS_B ();
Packit 5c3484
}
Packit 5c3484
/* Measure the count_trailing_zeros macro.

   The function body is assembled from SPEED_ROUTINE_COUNT_ZEROS_A and
   SPEED_ROUTINE_COUNT_ZEROS_B, both defined outside this function; the
   statement placed between them is the operation being measured.  That
   statement uses c and n, which are not declared here -- presumably the _A
   macro declares them (confirm against its definition).

   _A is given (0, 0).  NOTE(review): these look like "not leading" and
   "zero operand not allowed" flags for the test data -- confirm.  */
double
Packit 5c3484
speed_count_trailing_zeros (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_COUNT_ZEROS_A (0, 0);
Packit 5c3484
  count_trailing_zeros (c, n);
Packit 5c3484
  SPEED_ROUTINE_COUNT_ZEROS_B ();
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
/* Measure mpn_get_str.

   The whole body comes from the SPEED_ROUTINE_MPN_GET_STR macro (defined
   outside this chunk), instantiated with mpn_get_str as the function to
   call.  Operand setup, the timing loop and the returned double are all
   supplied by that macro -- see its definition for details.  */
double
Packit 5c3484
speed_mpn_get_str (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_GET_STR (mpn_get_str);
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Measure mpn_set_str.

   The whole body comes from the SPEED_ROUTINE_MPN_SET_STR_CALL macro
   (defined outside this chunk).  The argument is the call expression to be
   measured; it refers to wp, xp and base, which are not declared here --
   presumably the macro provides them (confirm against its definition).  */
double
Packit 5c3484
speed_mpn_set_str (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SET_STR_CALL (mpn_set_str (wp, xp, s->size, base));
Packit 5c3484
}
Packit 5c3484
/* Measure mpn_bc_set_str.

   Same shape as the mpn_set_str measurement: the whole body comes from the
   SPEED_ROUTINE_MPN_SET_STR_CALL macro (defined outside this chunk), here
   given a call to mpn_bc_set_str.  The call expression refers to wp, xp
   and base, which are not declared here -- presumably the macro provides
   them (confirm against its definition).  */
double
Packit 5c3484
speed_mpn_bc_set_str (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_SET_STR_CALL (mpn_bc_set_str (wp, xp, s->size, base));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
/* Measure the MPN_ZERO macro applied to s->size limbs at wp.

   The whole body comes from the SPEED_ROUTINE_MPN_ZERO_CALL macro (defined
   outside this chunk).  The argument is the call expression to be
   measured; wp is not declared here -- presumably the macro provides it
   (confirm against its definition).  */
double
Packit 5c3484
speed_MPN_ZERO (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  SPEED_ROUTINE_MPN_ZERO_CALL (MPN_ZERO (wp, s->size));
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
Packit 5c3484
int
Packit 5c3484
speed_randinit (struct speed_params *s, gmp_randstate_ptr rstate)
Packit 5c3484
{
Packit 5c3484
  if (s->r == 0)
Packit 5c3484
    gmp_randinit_default (rstate);
Packit 5c3484
  else if (s->r == 1)
Packit 5c3484
    gmp_randinit_mt (rstate);
Packit 5c3484
  else
Packit 5c3484
    {
Packit 5c3484
      return gmp_randinit_lc_2exp_size (rstate, s->r);
Packit 5c3484
    }
Packit 5c3484
  return 1;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_gmp_randseed (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  gmp_randstate_t  rstate;
Packit 5c3484
  unsigned  i;
Packit 5c3484
  double    t;
Packit 5c3484
  mpz_t     x;
Packit 5c3484
Packit 5c3484
  SPEED_RESTRICT_COND (s->size >= 1);
Packit 5c3484
  SPEED_RESTRICT_COND (speed_randinit (s, rstate));
Packit 5c3484
Packit 5c3484
  /* s->size bits of seed */
Packit 5c3484
  mpz_init_set_n (x, s->xp, s->size);
Packit 5c3484
  mpz_fdiv_r_2exp (x, x, (unsigned long) s->size);
Packit 5c3484
Packit 5c3484
  /* cache priming */
Packit 5c3484
  gmp_randseed (rstate, x);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    gmp_randseed (rstate, x);
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  gmp_randclear (rstate);
Packit 5c3484
  mpz_clear (x);
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_gmp_randseed_ui (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  gmp_randstate_t  rstate;
Packit 5c3484
  unsigned  i, j;
Packit 5c3484
  double    t;
Packit 5c3484
Packit 5c3484
  SPEED_RESTRICT_COND (speed_randinit (s, rstate));
Packit 5c3484
Packit 5c3484
  /* cache priming */
Packit 5c3484
  gmp_randseed_ui (rstate, 123L);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  j = 0;
Packit 5c3484
  do
Packit 5c3484
    {
Packit 5c3484
      gmp_randseed_ui (rstate, (unsigned long) s->xp_block[j]);
Packit 5c3484
      j++;
Packit 5c3484
      if (j >= SPEED_BLOCK_SIZE)
Packit 5c3484
	j = 0;
Packit 5c3484
    }
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  gmp_randclear (rstate);
Packit 5c3484
  return t;
Packit 5c3484
}
Packit 5c3484
Packit 5c3484
double
Packit 5c3484
speed_mpz_urandomb (struct speed_params *s)
Packit 5c3484
{
Packit 5c3484
  gmp_randstate_t  rstate;
Packit 5c3484
  mpz_t     z;
Packit 5c3484
  unsigned  i;
Packit 5c3484
  double    t;
Packit 5c3484
Packit 5c3484
  SPEED_RESTRICT_COND (s->size >= 0);
Packit 5c3484
  SPEED_RESTRICT_COND (speed_randinit (s, rstate));
Packit 5c3484
Packit 5c3484
  mpz_init (z);
Packit 5c3484
Packit 5c3484
  /* cache priming */
Packit 5c3484
  mpz_urandomb (z, rstate, (unsigned long) s->size);
Packit 5c3484
  mpz_urandomb (z, rstate, (unsigned long) s->size);
Packit 5c3484
Packit 5c3484
  speed_starttime ();
Packit 5c3484
  i = s->reps;
Packit 5c3484
  do
Packit 5c3484
    mpz_urandomb (z, rstate, (unsigned long) s->size);
Packit 5c3484
  while (--i != 0);
Packit 5c3484
  t = speed_endtime ();
Packit 5c3484
Packit 5c3484
  mpz_clear (z);
Packit 5c3484
  gmp_randclear (rstate);
Packit 5c3484
  return t;
Packit 5c3484
}