Blame soft-fp/op-4.h

Packit 6c4009
/* Software floating-point emulation.
Packit 6c4009
   Basic four-word fraction declaration and manipulation.
Packit 6c4009
   Copyright (C) 1997-2018 Free Software Foundation, Inc.
Packit 6c4009
   This file is part of the GNU C Library.
Packit 6c4009
   Contributed by Richard Henderson (rth@cygnus.com),
Packit 6c4009
		  Jakub Jelinek (jj@ultra.linux.cz),
Packit 6c4009
		  David S. Miller (davem@redhat.com) and
Packit 6c4009
		  Peter Maydell (pmaydell@chiark.greenend.org.uk).
Packit 6c4009
Packit 6c4009
   The GNU C Library is free software; you can redistribute it and/or
Packit 6c4009
   modify it under the terms of the GNU Lesser General Public
Packit 6c4009
   License as published by the Free Software Foundation; either
Packit 6c4009
   version 2.1 of the License, or (at your option) any later version.
Packit 6c4009
Packit 6c4009
   In addition to the permissions in the GNU Lesser General Public
Packit 6c4009
   License, the Free Software Foundation gives you unlimited
Packit 6c4009
   permission to link the compiled version of this file into
Packit 6c4009
   combinations with other programs, and to distribute those
Packit 6c4009
   combinations without any restriction coming from the use of this
Packit 6c4009
   file.  (The Lesser General Public License restrictions do apply in
Packit 6c4009
   other respects; for example, they cover modification of the file,
Packit 6c4009
   and distribution when not linked into a combine executable.)
Packit 6c4009
Packit 6c4009
   The GNU C Library is distributed in the hope that it will be useful,
Packit 6c4009
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 6c4009
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 6c4009
   Lesser General Public License for more details.
Packit 6c4009
Packit 6c4009
   You should have received a copy of the GNU Lesser General Public
Packit 6c4009
   License along with the GNU C Library; if not, see
Packit 6c4009
   <http://www.gnu.org/licenses/>.  */
Packit 6c4009
Packit 6c4009
#ifndef SOFT_FP_OP_4_H
Packit 6c4009
#define SOFT_FP_OP_4_H	1
Packit 6c4009
Packit 6c4009
/* Storage and word accessors for a four-word fraction.  The fraction
   of X is the array X_f; word 0 is the low word and word 3 the high
   word.  */

/* Declare the four-word fraction array belonging to X.  */
#define _FP_FRAC_DECL_4(X)	_FP_W_TYPE X##_f[4]

/* Copy every fraction word of S into D, low word first.  */
#define _FP_FRAC_COPY_4(D, S)	\
  (D##_f[0] = S##_f[0],		\
   D##_f[1] = S##_f[1],		\
   D##_f[2] = S##_f[2],		\
   D##_f[3] = S##_f[3])

/* Assign the fraction of X from I, where I expands to the four
   comma-separated words expected by __FP_FRAC_SET_4.  */
#define _FP_FRAC_SET_4(X, I)	__FP_FRAC_SET_4 (X, I)

/* Lvalue for the most significant word of X.  */
#define _FP_FRAC_HIGH_4(X)	(X##_f[3])

/* Lvalue for the least significant word of X.  */
#define _FP_FRAC_LOW_4(X)	(X##_f[0])

/* Lvalue for word number w of X.  */
#define _FP_FRAC_WORD_4(X, w)	(X##_f[w])
Packit 6c4009
Packit 6c4009
/* Shift the four-word fraction X left by N bits in place.  Vacated
   low-order bits become zero.  N is evaluated twice.  */
#define _FP_FRAC_SLL_4(X, N)						\
  do									\
    {									\
      _FP_I_TYPE _FP_FRAC_SLL_4_words = (N) / _FP_W_TYPE_SIZE;		\
      _FP_I_TYPE _FP_FRAC_SLL_4_lsh = (N) % _FP_W_TYPE_SIZE;		\
      _FP_I_TYPE _FP_FRAC_SLL_4_rsh					\
	= _FP_W_TYPE_SIZE - _FP_FRAC_SLL_4_lsh;				\
      _FP_I_TYPE _FP_FRAC_SLL_4_dst = 3;				\
      if (_FP_FRAC_SLL_4_lsh == 0)					\
	{								\
	  /* Whole-word shift: move words up unchanged.  */		\
	  while (_FP_FRAC_SLL_4_dst >= _FP_FRAC_SLL_4_words)		\
	    {								\
	      X##_f[_FP_FRAC_SLL_4_dst]					\
		= X##_f[_FP_FRAC_SLL_4_dst - _FP_FRAC_SLL_4_words];	\
	      --_FP_FRAC_SLL_4_dst;					\
	    }								\
	}								\
      else								\
	{								\
	  /* Each result word combines two neighbouring sources.  */	\
	  while (_FP_FRAC_SLL_4_dst > _FP_FRAC_SLL_4_words)		\
	    {								\
	      X##_f[_FP_FRAC_SLL_4_dst]					\
		= ((X##_f[_FP_FRAC_SLL_4_dst - _FP_FRAC_SLL_4_words]	\
		    << _FP_FRAC_SLL_4_lsh)				\
		   | (X##_f[_FP_FRAC_SLL_4_dst				\
			    - _FP_FRAC_SLL_4_words - 1]			\
		      >> _FP_FRAC_SLL_4_rsh));				\
	      --_FP_FRAC_SLL_4_dst;					\
	    }								\
	  /* The lowest surviving word has no lower neighbour.  */	\
	  X##_f[_FP_FRAC_SLL_4_dst] = X##_f[0] << _FP_FRAC_SLL_4_lsh;	\
	  --_FP_FRAC_SLL_4_dst;						\
	}								\
      /* Zero the words that were shifted in from below.  */		\
      while (_FP_FRAC_SLL_4_dst >= 0)					\
	{								\
	  X##_f[_FP_FRAC_SLL_4_dst] = 0;				\
	  --_FP_FRAC_SLL_4_dst;						\
	}								\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
/* Shift the four-word fraction X right by N bits in place (logical
   shift).  Vacated high-order bits become zero and bits shifted out
   at the bottom are discarded.  N is evaluated twice.  */
#define _FP_FRAC_SRL_4(X, N)						\
  do									\
    {									\
      _FP_I_TYPE _FP_FRAC_SRL_4_words = (N) / _FP_W_TYPE_SIZE;		\
      _FP_I_TYPE _FP_FRAC_SRL_4_rsh = (N) % _FP_W_TYPE_SIZE;		\
      _FP_I_TYPE _FP_FRAC_SRL_4_lsh					\
	= _FP_W_TYPE_SIZE - _FP_FRAC_SRL_4_rsh;				\
      _FP_I_TYPE _FP_FRAC_SRL_4_dst = 0;				\
      if (_FP_FRAC_SRL_4_rsh == 0)					\
	{								\
	  /* Whole-word shift: move words down unchanged.  */		\
	  while (_FP_FRAC_SRL_4_dst <= 3 - _FP_FRAC_SRL_4_words)	\
	    {								\
	      X##_f[_FP_FRAC_SRL_4_dst]					\
		= X##_f[_FP_FRAC_SRL_4_dst + _FP_FRAC_SRL_4_words];	\
	      ++_FP_FRAC_SRL_4_dst;					\
	    }								\
	}								\
      else								\
	{								\
	  /* Each result word combines two neighbouring sources.  */	\
	  while (_FP_FRAC_SRL_4_dst < 3 - _FP_FRAC_SRL_4_words)		\
	    {								\
	      X##_f[_FP_FRAC_SRL_4_dst]					\
		= ((X##_f[_FP_FRAC_SRL_4_dst + _FP_FRAC_SRL_4_words]	\
		    >> _FP_FRAC_SRL_4_rsh)				\
		   | (X##_f[_FP_FRAC_SRL_4_dst				\
			    + _FP_FRAC_SRL_4_words + 1]			\
		      << _FP_FRAC_SRL_4_lsh));				\
	      ++_FP_FRAC_SRL_4_dst;					\
	    }								\
	  /* The highest surviving word has no upper neighbour.  */	\
	  X##_f[_FP_FRAC_SRL_4_dst] = X##_f[3] >> _FP_FRAC_SRL_4_rsh;	\
	  ++_FP_FRAC_SRL_4_dst;						\
	}								\
      /* Zero the words that were shifted in from above.  */		\
      while (_FP_FRAC_SRL_4_dst < 4)					\
	{								\
	  X##_f[_FP_FRAC_SRL_4_dst] = 0;				\
	  ++_FP_FRAC_SRL_4_dst;						\
	}								\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Right shift with a separate sticky result.
   X is shifted right by N bits in place, exactly like a logical
   right shift.  S is then assigned 1 if any bit that fell off the
   right hand side was set, and 0 otherwise.  The size argument is not
   used by this implementation.  N is evaluated twice.  */
#define _FP_FRAC_SRST_4(X, S, N, size)					\
  do									\
    {									\
      _FP_I_TYPE _FP_FRAC_SRST_4_words = (N) / _FP_W_TYPE_SIZE;	\
      _FP_I_TYPE _FP_FRAC_SRST_4_rsh = (N) % _FP_W_TYPE_SIZE;		\
      _FP_I_TYPE _FP_FRAC_SRST_4_lsh					\
	= _FP_W_TYPE_SIZE - _FP_FRAC_SRST_4_rsh;			\
      _FP_I_TYPE _FP_FRAC_SRST_4_idx;					\
      _FP_W_TYPE _FP_FRAC_SRST_4_lost = 0;				\
      /* Whole words that drop out entirely.  */			\
      for (_FP_FRAC_SRST_4_idx = 0;					\
	   _FP_FRAC_SRST_4_idx < _FP_FRAC_SRST_4_words;			\
	   ++_FP_FRAC_SRST_4_idx)					\
	_FP_FRAC_SRST_4_lost |= X##_f[_FP_FRAC_SRST_4_idx];		\
      if (_FP_FRAC_SRST_4_rsh == 0)					\
	{								\
	  for (_FP_FRAC_SRST_4_idx = 0;					\
	       _FP_FRAC_SRST_4_idx <= 3 - _FP_FRAC_SRST_4_words;	\
	       ++_FP_FRAC_SRST_4_idx)					\
	    X##_f[_FP_FRAC_SRST_4_idx]					\
	      = X##_f[_FP_FRAC_SRST_4_idx + _FP_FRAC_SRST_4_words];	\
	}								\
      else								\
	{								\
	  /* Low bits of the first surviving word drop out too; the	\
	     index still holds the value left by the loop above.  */	\
	  _FP_FRAC_SRST_4_lost						\
	    |= X##_f[_FP_FRAC_SRST_4_idx] << _FP_FRAC_SRST_4_lsh;	\
	  for (_FP_FRAC_SRST_4_idx = 0;					\
	       _FP_FRAC_SRST_4_idx < 3 - _FP_FRAC_SRST_4_words;		\
	       ++_FP_FRAC_SRST_4_idx)					\
	    X##_f[_FP_FRAC_SRST_4_idx]					\
	      = ((X##_f[_FP_FRAC_SRST_4_idx + _FP_FRAC_SRST_4_words]	\
		  >> _FP_FRAC_SRST_4_rsh)				\
		 | (X##_f[_FP_FRAC_SRST_4_idx				\
			  + _FP_FRAC_SRST_4_words + 1]			\
		    << _FP_FRAC_SRST_4_lsh));				\
	  X##_f[_FP_FRAC_SRST_4_idx] = X##_f[3] >> _FP_FRAC_SRST_4_rsh;	\
	  ++_FP_FRAC_SRST_4_idx;					\
	}								\
      /* Zero the words that were shifted in from above.  */		\
      while (_FP_FRAC_SRST_4_idx < 4)					\
	{								\
	  X##_f[_FP_FRAC_SRST_4_idx] = 0;				\
	  ++_FP_FRAC_SRST_4_idx;					\
	}								\
      S = (_FP_FRAC_SRST_4_lost != 0);					\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
/* Shift X right by N bits with _FP_FRAC_SRST_4 and fold the sticky
   result it reports into the least significant bit of X.  */
#define _FP_FRAC_SRS_4(X, N, size)				\
  do								\
    {								\
      int _FP_FRAC_SRS_4_lost;					\
      _FP_FRAC_SRST_4 (X, _FP_FRAC_SRS_4_lost, (N), (size));	\
      X##_f[0] = X##_f[0] | _FP_FRAC_SRS_4_lost;		\
    }								\
  while (0)
Packit 6c4009
Packit 6c4009
/* Four-word arithmetic front ends.  Each one spreads its operands
   into individual words, most significant first, and forwards them to
   the matching __FP_FRAC_*_4 primitive.  */

/* R = X + Y.  */
#define _FP_FRAC_ADD_4(R, X, Y)				\
  __FP_FRAC_ADD_4 (R##_f[3], R##_f[2],			\
		   R##_f[1], R##_f[0],			\
		   X##_f[3], X##_f[2],			\
		   X##_f[1], X##_f[0],			\
		   Y##_f[3], Y##_f[2],			\
		   Y##_f[1], Y##_f[0])

/* R = X - Y.  */
#define _FP_FRAC_SUB_4(R, X, Y)				\
  __FP_FRAC_SUB_4 (R##_f[3], R##_f[2],			\
		   R##_f[1], R##_f[0],			\
		   X##_f[3], X##_f[2],			\
		   X##_f[1], X##_f[0],			\
		   Y##_f[3], Y##_f[2],			\
		   Y##_f[1], Y##_f[0])

/* Forward X and Y to __FP_FRAC_DEC_4 (X is the first operand).  */
#define _FP_FRAC_DEC_4(X, Y)				\
  __FP_FRAC_DEC_4 (X##_f[3], X##_f[2],			\
		   X##_f[1], X##_f[0],			\
		   Y##_f[3], Y##_f[2],			\
		   Y##_f[1], Y##_f[0])

/* Forward X and the single value I to __FP_FRAC_ADDI_4.  */
#define _FP_FRAC_ADDI_4(X, I)				\
  __FP_FRAC_ADDI_4 (X##_f[3], X##_f[2],			\
		    X##_f[1], X##_f[0], I)
Packit 6c4009
Packit 6c4009
/* Constant four-word fractions, written as four comma-separated words
   with the most significant word first.  */

/* All words zero.  */
#define _FP_ZEROFRAC_4	0, 0, 0, 0

/* Only the lowest bit of the least significant word set.  */
#define _FP_MINFRAC_4	0, 0, 0, 1

/* Every bit of every word set.  */
#define _FP_MAXFRAC_4		\
  (~(_FP_WS_TYPE) 0),		\
  (~(_FP_WS_TYPE) 0),		\
  (~(_FP_WS_TYPE) 0),		\
  (~(_FP_WS_TYPE) 0)
Packit 6c4009
Packit 6c4009
/* Nonzero when every word of X is zero.  */
#define _FP_FRAC_ZEROP_4(X)	\
  (0 == (X##_f[3] | X##_f[2] | X##_f[1] | X##_f[0]))

/* Nonzero when the high word of X, viewed as signed, is negative.  */
#define _FP_FRAC_NEGP_4(X)	(0 > (_FP_WS_TYPE) X##_f[3])

/* The high word of X masked with the overflow bit of format fs.  */
#define _FP_FRAC_OVERP_4(fs, X)	\
  (_FP_FRAC_HIGH_##fs (X) & _FP_OVERFLOW_##fs)

/* The double-width high word of X masked with _FP_HIGHBIT_DW_fs.  */
#define _FP_FRAC_HIGHBIT_DW_4(fs, X)	\
  (_FP_FRAC_HIGH_DW_##fs (X) & _FP_HIGHBIT_DW_##fs)

/* Clear the overflow bit of format fs in the high word of X.  */
#define _FP_FRAC_CLEAR_OVERP_4(fs, X)	\
  (_FP_FRAC_HIGH_##fs (X) &= ~_FP_OVERFLOW_##fs)
Packit 6c4009
Packit 6c4009
/* Nonzero when all four words of X and Y are equal.  */
#define _FP_FRAC_EQ_4(X, Y)		\
  (X##_f[3] == Y##_f[3]			\
   && X##_f[2] == Y##_f[2]		\
   && X##_f[1] == Y##_f[1]		\
   && X##_f[0] == Y##_f[0])
Packit 6c4009
Packit 6c4009
/* Nonzero when X > Y.  Words are compared from the most significant
   down; the first differing word decides.  */
#define _FP_FRAC_GT_4(X, Y)				\
  (X##_f[3] != Y##_f[3] ? X##_f[3] > Y##_f[3]		\
   : X##_f[2] != Y##_f[2] ? X##_f[2] > Y##_f[2]		\
   : X##_f[1] != Y##_f[1] ? X##_f[1] > Y##_f[1]		\
   : X##_f[0] > Y##_f[0])
Packit 6c4009
Packit 6c4009
/* Nonzero when X >= Y.  Words are compared from the most significant
   down; the first differing word decides, and equal values compare
   as true.  */
#define _FP_FRAC_GE_4(X, Y)				\
  (X##_f[3] != Y##_f[3] ? X##_f[3] > Y##_f[3]		\
   : X##_f[2] != Y##_f[2] ? X##_f[2] > Y##_f[2]		\
   : X##_f[1] != Y##_f[1] ? X##_f[1] > Y##_f[1]		\
   : X##_f[0] >= Y##_f[0])
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Store in R the number of leading zero bits of the four-word
   fraction X.  __FP_CLZ is applied to the highest nonzero word and one
   word width is added for every all-zero word above it.  When all
   words are zero, __FP_CLZ is applied to word 0.  */
#define _FP_FRAC_CLZ_4(R, X)				\
  do							\
    {							\
      if (X##_f[3] != 0)				\
	{						\
	  __FP_CLZ ((R), X##_f[3]);			\
	}						\
      else if (X##_f[2] != 0)				\
	{						\
	  __FP_CLZ ((R), X##_f[2]);			\
	  (R) += _FP_W_TYPE_SIZE;			\
	}						\
      else if (X##_f[1] != 0)				\
	{						\
	  __FP_CLZ ((R), X##_f[1]);			\
	  (R) += _FP_W_TYPE_SIZE*2;			\
	}						\
      else						\
	{						\
	  __FP_CLZ ((R), X##_f[0]);			\
	  (R) += _FP_W_TYPE_SIZE*3;			\
	}						\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Split the floating-point value val of format fs into its raw
   fields: sign into X_s, exponent into X_e and the four fraction
   fields into X_f[0..3].  The value is copied into a local
   union _FP_UNION_fs and read back through its bits member.  */
#define _FP_UNPACK_RAW_4(fs, X, val)			\
  do							\
    {							\
      union _FP_UNION_##fs _FP_UNPACK_RAW_4_u;		\
      _FP_UNPACK_RAW_4_u.flt = (val);			\
      X##_s = _FP_UNPACK_RAW_4_u.bits.sign;		\
      X##_e = _FP_UNPACK_RAW_4_u.bits.exp;		\
      X##_f[3] = _FP_UNPACK_RAW_4_u.bits.frac3;		\
      X##_f[2] = _FP_UNPACK_RAW_4_u.bits.frac2;		\
      X##_f[1] = _FP_UNPACK_RAW_4_u.bits.frac1;		\
      X##_f[0] = _FP_UNPACK_RAW_4_u.bits.frac0;		\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Pointer variant of _FP_UNPACK_RAW_4: val is cast to
   union _FP_UNION_fs * and the sign, exponent and four fraction fields
   are read through it into X_s, X_e and X_f[0..3].  */
#define _FP_UNPACK_RAW_4_P(fs, X, val)			\
  do							\
    {							\
      union _FP_UNION_##fs *_FP_UNPACK_RAW_4_P_u	\
	= (union _FP_UNION_##fs *) (val);		\
							\
      X##_s = _FP_UNPACK_RAW_4_P_u->bits.sign;		\
      X##_e = _FP_UNPACK_RAW_4_P_u->bits.exp;		\
      X##_f[3] = _FP_UNPACK_RAW_4_P_u->bits.frac3;	\
      X##_f[2] = _FP_UNPACK_RAW_4_P_u->bits.frac2;	\
      X##_f[1] = _FP_UNPACK_RAW_4_P_u->bits.frac1;	\
      X##_f[0] = _FP_UNPACK_RAW_4_P_u->bits.frac0;	\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Assemble a floating-point value of format fs from the raw fields
   X_s, X_e and X_f[0..3] and assign it to val.  The fields are stored
   into a local union _FP_UNION_fs whose flt member is then copied
   out.  */
#define _FP_PACK_RAW_4(fs, val, X)			\
  do							\
    {							\
      union _FP_UNION_##fs _FP_PACK_RAW_4_u;		\
      _FP_PACK_RAW_4_u.bits.sign  = X##_s;		\
      _FP_PACK_RAW_4_u.bits.exp   = X##_e;		\
      _FP_PACK_RAW_4_u.bits.frac3 = X##_f[3];		\
      _FP_PACK_RAW_4_u.bits.frac2 = X##_f[2];		\
      _FP_PACK_RAW_4_u.bits.frac1 = X##_f[1];		\
      _FP_PACK_RAW_4_u.bits.frac0 = X##_f[0];		\
      (val) = _FP_PACK_RAW_4_u.flt;			\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Pointer variant of _FP_PACK_RAW_4: val is cast to
   union _FP_UNION_fs * and the raw fields X_s, X_e and X_f[0..3] are
   stored through it.  */
#define _FP_PACK_RAW_4_P(fs, val, X)			\
  do							\
    {							\
      union _FP_UNION_##fs *_FP_PACK_RAW_4_P_u		\
	= (union _FP_UNION_##fs *) (val);		\
							\
      _FP_PACK_RAW_4_P_u->bits.sign  = X##_s;		\
      _FP_PACK_RAW_4_P_u->bits.exp   = X##_e;		\
      _FP_PACK_RAW_4_P_u->bits.frac3 = X##_f[3];	\
      _FP_PACK_RAW_4_P_u->bits.frac2 = X##_f[2];	\
      _FP_PACK_RAW_4_P_u->bits.frac1 = X##_f[1];	\
      _FP_PACK_RAW_4_P_u->bits.frac0 = X##_f[0];	\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Multiplication algorithms: */
Packit 6c4009
Packit 6c4009
/* Given a 1W * 1W => 2W primitive, do the extended multiplication.  */
Packit 6c4009
Packit 6c4009
/* Full four-word by four-word multiplication into the eight-word
   fraction R (accessed through _FP_FRAC_WORD_8, words 0..7).

   doit is invoked once for each of the sixteen pairs X_f[i], Y_f[j];
   its first two arguments receive the result and the last two are the
   operands.  Judging by the f1/f0 naming the first argument is the
   high word and the second the low word of the product -- confirm
   against the primitive supplied by the caller.

   Partial products are accumulated column by column with
   __FP_FRAC_ADD_3 (and __FP_FRAC_ADD_2 for the final X_f[3] * Y_f[3]
   term), using the five two-word temporaries b..f declared below.
   The statement order matters: the running sum in R is always passed
   as the last operand group of __FP_FRAC_ADD_3, and that same storage
   is the destination.

   wfracbits is not referenced by this macro.  */
#define _FP_MUL_MEAT_DW_4_wide(wfracbits, R, X, Y, doit)		\
Packit 6c4009
  do									\
Packit 6c4009
    {									\
Packit 6c4009
      _FP_FRAC_DECL_2 (_FP_MUL_MEAT_DW_4_wide_b);			\
Packit 6c4009
      _FP_FRAC_DECL_2 (_FP_MUL_MEAT_DW_4_wide_c);			\
Packit 6c4009
      _FP_FRAC_DECL_2 (_FP_MUL_MEAT_DW_4_wide_d);			\
Packit 6c4009
      _FP_FRAC_DECL_2 (_FP_MUL_MEAT_DW_4_wide_e);			\
Packit 6c4009
      _FP_FRAC_DECL_2 (_FP_MUL_MEAT_DW_4_wide_f);			\
Packit 6c4009
									\
Packit 6c4009
      doit (_FP_FRAC_WORD_8 (R, 1), _FP_FRAC_WORD_8 (R, 0),		\
Packit 6c4009
	    X##_f[0], Y##_f[0]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_b_f1, _FP_MUL_MEAT_DW_4_wide_b_f0,	\
Packit 6c4009
	    X##_f[0], Y##_f[1]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_c_f1, _FP_MUL_MEAT_DW_4_wide_c_f0,	\
Packit 6c4009
	    X##_f[1], Y##_f[0]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_d_f1, _FP_MUL_MEAT_DW_4_wide_d_f0,	\
Packit 6c4009
	    X##_f[1], Y##_f[1]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_e_f1, _FP_MUL_MEAT_DW_4_wide_e_f0,	\
Packit 6c4009
	    X##_f[0], Y##_f[2]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_f_f1, _FP_MUL_MEAT_DW_4_wide_f_f0,	\
Packit 6c4009
	    X##_f[2], Y##_f[0]);					\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 3), _FP_FRAC_WORD_8 (R, 2),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 1), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f0,			\
Packit 6c4009
		       0, 0, _FP_FRAC_WORD_8 (R, 1));			\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 3), _FP_FRAC_WORD_8 (R, 2),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 1), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3), _FP_FRAC_WORD_8 (R, 2),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 1));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 2), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f0,			\
Packit 6c4009
		       0, _FP_FRAC_WORD_8 (R, 3), _FP_FRAC_WORD_8 (R, 2)); \
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 2), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 2));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 2), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_f_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_f_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 2));				\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_b_f1,				\
Packit 6c4009
	    _FP_MUL_MEAT_DW_4_wide_b_f0, X##_f[0], Y##_f[3]);		\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_c_f1,				\
Packit 6c4009
	    _FP_MUL_MEAT_DW_4_wide_c_f0, X##_f[3], Y##_f[0]);		\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_d_f1, _FP_MUL_MEAT_DW_4_wide_d_f0,	\
Packit 6c4009
	    X##_f[1], Y##_f[2]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_e_f1, _FP_MUL_MEAT_DW_4_wide_e_f0,	\
Packit 6c4009
	    X##_f[2], Y##_f[1]);					\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f0,			\
Packit 6c4009
		       0, _FP_FRAC_WORD_8 (R, 4), _FP_FRAC_WORD_8 (R, 3)); \
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 3));				\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_b_f1, _FP_MUL_MEAT_DW_4_wide_b_f0,	\
Packit 6c4009
	    X##_f[2], Y##_f[2]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_c_f1, _FP_MUL_MEAT_DW_4_wide_c_f0,	\
Packit 6c4009
	    X##_f[1], Y##_f[3]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_d_f1, _FP_MUL_MEAT_DW_4_wide_d_f0,	\
Packit 6c4009
	    X##_f[3], Y##_f[1]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_e_f1, _FP_MUL_MEAT_DW_4_wide_e_f0,	\
Packit 6c4009
	    X##_f[2], Y##_f[3]);					\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_f_f1, _FP_MUL_MEAT_DW_4_wide_f_f0,	\
Packit 6c4009
	    X##_f[3], Y##_f[2]);					\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f0,			\
Packit 6c4009
		       0, _FP_FRAC_WORD_8 (R, 5), _FP_FRAC_WORD_8 (R, 4)); \
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_c_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_d_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 4));				\
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 7), _FP_FRAC_WORD_8 (R, 6),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_e_f0,			\
Packit 6c4009
		       0, _FP_FRAC_WORD_8 (R, 6), _FP_FRAC_WORD_8 (R, 5)); \
Packit 6c4009
      __FP_FRAC_ADD_3 (_FP_FRAC_WORD_8 (R, 7), _FP_FRAC_WORD_8 (R, 6),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5), 0,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_f_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_f_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 7), _FP_FRAC_WORD_8 (R, 6),	\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 5));				\
Packit 6c4009
      doit (_FP_MUL_MEAT_DW_4_wide_b_f1, _FP_MUL_MEAT_DW_4_wide_b_f0,	\
Packit 6c4009
	    X##_f[3], Y##_f[3]);					\
Packit 6c4009
      __FP_FRAC_ADD_2 (_FP_FRAC_WORD_8 (R, 7), _FP_FRAC_WORD_8 (R, 6),	\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f1,			\
Packit 6c4009
		       _FP_MUL_MEAT_DW_4_wide_b_f0,			\
Packit 6c4009
		       _FP_FRAC_WORD_8 (R, 7), _FP_FRAC_WORD_8 (R, 6));	\
Packit 6c4009
    }									\
Packit 6c4009
  while (0)
Packit 6c4009
Packit 6c4009
/* Multiply the four-word fractions X and Y and store the normalized
   four-word result in R.  The full eight-word product is formed by
   _FP_MUL_MEAT_DW_4_wide using the primitive doit, shifted right
   (with sticky bit) by wfracbits - 1, and its low four words are
   then copied to R.  */
#define _FP_MUL_MEAT_4_wide(wfracbits, R, X, Y, doit)			\
  do									\
    {									\
      _FP_FRAC_DECL_8 (_FP_MUL_MEAT_4_wide_prod);			\
									\
      _FP_MUL_MEAT_DW_4_wide ((wfracbits),				\
			      _FP_MUL_MEAT_4_wide_prod,			\
			      X, Y, doit);				\
									\
      /* Normalize: since we know where the msb of the multiplicands	\
	 was (bit B), we know that the msb of the product is at	\
	 either 2B or 2B-1.  */						\
      _FP_FRAC_SRS_8 (_FP_MUL_MEAT_4_wide_prod, (wfracbits)-1,		\
		      2*(wfracbits));					\
      __FP_FRAC_SET_4 (R,						\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_wide_prod, 3),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_wide_prod, 2),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_wide_prod, 1),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_wide_prod, 0));	\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
/* Full four-word by four-word multiplication using GMP's mpn_mul_n:
   the eight-word product of X_f and Y_f is written to R_f.  The
   operands are taken from the X and Y macro arguments (earlier this
   macro ignored them and referred to the fixed names _x_f and _y_f).
   wfracbits is not referenced by this macro.  */
#define _FP_MUL_MEAT_DW_4_gmp(wfracbits, R, X, Y)	\
  do							\
    {							\
      mpn_mul_n (R##_f, X##_f, Y##_f, 4);		\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Multiply the four-word fractions X and Y and store the normalized
   four-word result in R.  The full eight-word product is formed by
   _FP_MUL_MEAT_DW_4_gmp, shifted right (with sticky bit) by
   wfracbits - 1, and its low four words are then copied to R.  */
#define _FP_MUL_MEAT_4_gmp(wfracbits, R, X, Y)				\
  do									\
    {									\
      _FP_FRAC_DECL_8 (_FP_MUL_MEAT_4_gmp_prod);			\
									\
      _FP_MUL_MEAT_DW_4_gmp ((wfracbits), _FP_MUL_MEAT_4_gmp_prod,	\
			     X, Y);					\
									\
      /* Normalize: since we know where the msb of the multiplicands	\
	 was (bit B), we know that the msb of the product is at	\
	 either 2B or 2B-1.  */						\
      _FP_FRAC_SRS_8 (_FP_MUL_MEAT_4_gmp_prod, (wfracbits)-1,		\
		      2*(wfracbits));					\
      __FP_FRAC_SET_4 (R,						\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_gmp_prod, 3),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_gmp_prod, 2),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_gmp_prod, 1),	\
		       _FP_FRAC_WORD_8 (_FP_MUL_MEAT_4_gmp_prod, 0));	\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
/* Helper for _FP_DIV_MEAT_4_udiv: multiply the single word m by the
   three-word number (n2, n1, n0) and store the four-word product in
   (p3, p2, p1, p0), most significant word first.  Each partial
   product comes from umul_ppmm; its low word is added into the
   running result with __FP_FRAC_ADDI_2.  */
#define umul_ppppmnnn(p3, p2, p1, p0, m, n2, n1, n0)	\
  do							\
    {							\
      UWtype umul_ppppmnnn_lo1;				\
      UWtype umul_ppppmnnn_lo2;				\
      /* m * n0 gives words 0 and 1.  */		\
      umul_ppmm (p1, p0, m, n0);			\
      /* m * n1 contributes to words 1 and 2.  */	\
      umul_ppmm (p2, umul_ppppmnnn_lo1, m, n1);		\
      __FP_FRAC_ADDI_2 (p2, p1, umul_ppppmnnn_lo1);	\
      /* m * n2 contributes to words 2 and 3.  */	\
      umul_ppmm (p3, umul_ppppmnnn_lo2, m, n2);		\
      __FP_FRAC_ADDI_2 (p3, p2, umul_ppppmnnn_lo2);	\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Division algorithms: */
Packit 6c4009
Packit 6c4009
/* Four-word fraction division R = X / Y built on udiv_qrnnd.
   X and Y are modified in place.

   Setup: a zeroed four-word temporary n is declared.  If X >= Y, the
   lowest bit of X is saved in the top of n_f[3] and X is shifted
   right by one; otherwise R_e is decremented.  Y is then shifted left
   by _FP_WFRACXBITS_fs.

   Main loop: i runs from 3 down to 0 and each pass stores one quotient
   word in R_f[i]; the loop is left only through the breaks taken when
   i is 0.
     - If the high words of X and Y are equal, the quotient word is set
       to all-ones and, unless this is the last word, the remainder is
       updated and the word is reduced to (UWtype)-2 when
       X_f[3] > Y_f[3] afterwards.
     - Otherwise udiv_qrnnd divides (X_f[3], X_f[2]) by Y_f[3],
       umul_ppppmnnn forms m = quotient word * (Y_f[2], Y_f[1], Y_f[0]),
       X is shifted up one word taking n_f[i] as the new low word, and
       the quotient word is decremented (adding Y back to X) up to
       twice while m exceeds X.  m is then subtracted from X.
   On the last word of the udiv_qrnnd path, _FP_WORK_STICKY is or-ed
   into R_f[0] when X and m differ.

   NOTE(review): when the equal-high-word path is taken on the last
   word (i == 0) the loop breaks without touching the sticky bit --
   confirm this is intended.  */
#define _FP_DIV_MEAT_4_udiv(fs, R, X, Y)				\
Packit 6c4009
  do									\
Packit 6c4009
    {									\
Packit 6c4009
      int _FP_DIV_MEAT_4_udiv_i;					\
Packit 6c4009
      _FP_FRAC_DECL_4 (_FP_DIV_MEAT_4_udiv_n);				\
Packit 6c4009
      _FP_FRAC_DECL_4 (_FP_DIV_MEAT_4_udiv_m);				\
Packit 6c4009
      _FP_FRAC_SET_4 (_FP_DIV_MEAT_4_udiv_n, _FP_ZEROFRAC_4);		\
Packit 6c4009
      if (_FP_FRAC_GE_4 (X, Y))						\
Packit 6c4009
	{								\
Packit 6c4009
	  _FP_DIV_MEAT_4_udiv_n_f[3]					\
Packit 6c4009
	    = X##_f[0] << (_FP_W_TYPE_SIZE - 1);			\
Packit 6c4009
	  _FP_FRAC_SRL_4 (X, 1);					\
Packit 6c4009
	}								\
Packit 6c4009
      else								\
Packit 6c4009
	R##_e--;							\
Packit 6c4009
									\
Packit 6c4009
      /* Normalize, i.e. make the most significant bit of the		\
Packit 6c4009
	 denominator set.  */						\
Packit 6c4009
      _FP_FRAC_SLL_4 (Y, _FP_WFRACXBITS_##fs);				\
Packit 6c4009
									\
Packit 6c4009
      for (_FP_DIV_MEAT_4_udiv_i = 3; ; _FP_DIV_MEAT_4_udiv_i--)	\
Packit 6c4009
	{								\
Packit 6c4009
	  if (X##_f[3] == Y##_f[3])					\
Packit 6c4009
	    {								\
Packit 6c4009
	      /* This is a special case, not an optimization		\
Packit 6c4009
		 (X##_f[3]/Y##_f[3] would not fit into UWtype).		\
Packit 6c4009
		 As X## is guaranteed to be < Y,			\
Packit 6c4009
		 R##_f[_FP_DIV_MEAT_4_udiv_i] can be either		\
Packit 6c4009
		 (UWtype)-1 or (UWtype)-2.  */				\
Packit 6c4009
	      R##_f[_FP_DIV_MEAT_4_udiv_i] = -1;			\
Packit 6c4009
	      if (!_FP_DIV_MEAT_4_udiv_i)				\
Packit 6c4009
		break;							\
Packit 6c4009
	      __FP_FRAC_SUB_4 (X##_f[3], X##_f[2], X##_f[1], X##_f[0],	\
Packit 6c4009
			       Y##_f[2], Y##_f[1], Y##_f[0], 0,		\
Packit 6c4009
			       X##_f[2], X##_f[1], X##_f[0],		\
Packit 6c4009
			       _FP_DIV_MEAT_4_udiv_n_f[_FP_DIV_MEAT_4_udiv_i]); \
Packit 6c4009
	      _FP_FRAC_SUB_4 (X, Y, X);					\
Packit 6c4009
	      if (X##_f[3] > Y##_f[3])					\
Packit 6c4009
		{							\
Packit 6c4009
		  R##_f[_FP_DIV_MEAT_4_udiv_i] = -2;			\
Packit 6c4009
		  _FP_FRAC_ADD_4 (X, Y, X);				\
Packit 6c4009
		}							\
Packit 6c4009
	    }								\
Packit 6c4009
	  else								\
Packit 6c4009
	    {								\
Packit 6c4009
	      udiv_qrnnd (R##_f[_FP_DIV_MEAT_4_udiv_i],			\
Packit 6c4009
			  X##_f[3], X##_f[3], X##_f[2], Y##_f[3]);	\
Packit 6c4009
	      umul_ppppmnnn (_FP_DIV_MEAT_4_udiv_m_f[3],		\
Packit 6c4009
			     _FP_DIV_MEAT_4_udiv_m_f[2],		\
Packit 6c4009
			     _FP_DIV_MEAT_4_udiv_m_f[1],		\
Packit 6c4009
			     _FP_DIV_MEAT_4_udiv_m_f[0],		\
Packit 6c4009
			     R##_f[_FP_DIV_MEAT_4_udiv_i],		\
Packit 6c4009
			     Y##_f[2], Y##_f[1], Y##_f[0]);		\
Packit 6c4009
	      X##_f[2] = X##_f[1];					\
Packit 6c4009
	      X##_f[1] = X##_f[0];					\
Packit 6c4009
	      X##_f[0]							\
Packit 6c4009
		= _FP_DIV_MEAT_4_udiv_n_f[_FP_DIV_MEAT_4_udiv_i];	\
Packit 6c4009
	      if (_FP_FRAC_GT_4 (_FP_DIV_MEAT_4_udiv_m, X))		\
Packit 6c4009
		{							\
Packit 6c4009
		  R##_f[_FP_DIV_MEAT_4_udiv_i]--;			\
Packit 6c4009
		  _FP_FRAC_ADD_4 (X, Y, X);				\
Packit 6c4009
		  if (_FP_FRAC_GE_4 (X, Y)				\
Packit 6c4009
		      && _FP_FRAC_GT_4 (_FP_DIV_MEAT_4_udiv_m, X))	\
Packit 6c4009
		    {							\
Packit 6c4009
		      R##_f[_FP_DIV_MEAT_4_udiv_i]--;			\
Packit 6c4009
		      _FP_FRAC_ADD_4 (X, Y, X);				\
Packit 6c4009
		    }							\
Packit 6c4009
		}							\
Packit 6c4009
	      _FP_FRAC_DEC_4 (X, _FP_DIV_MEAT_4_udiv_m);		\
Packit 6c4009
	      if (!_FP_DIV_MEAT_4_udiv_i)				\
Packit 6c4009
		{							\
Packit 6c4009
		  if (!_FP_FRAC_EQ_4 (X, _FP_DIV_MEAT_4_udiv_m))	\
Packit 6c4009
		    R##_f[0] |= _FP_WORK_STICKY;			\
Packit 6c4009
		  break;						\
Packit 6c4009
		}							\
Packit 6c4009
	    }								\
Packit 6c4009
	}								\
Packit 6c4009
    }									\
Packit 6c4009
  while (0)
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Square root algorithms:
Packit 6c4009
   We have just one right now, maybe Newton approximation
Packit 6c4009
   should be added for those machines where division is fast.  */
Packit 6c4009
Packit 6c4009
/* Bit-by-bit square root over a four-word fraction.  R accumulates
   the result, X is the remaining operand (shifted left by one after
   every bit), S is the running comparison value and T a scratch copy
   of S with the trial bit q added.  R, S, T, X and q are all modified.

   The work is done in four phases, one per result word from word 3
   down to word 0.  In each step T = S + q is formed in the current
   word; if T <= X (compared over the words handled so far) then
   S becomes T + q with carries propagated upwards, T is subtracted
   from X and q is added to the current word of R.  X is then shifted
   left by one bit and q right by one bit.

   The first phase starts from the value of q supplied by the caller;
   the later phases restart q at the top bit of a word.  The last
   phase stops when q reaches _FP_WORK_ROUND.  Finally, if X is
   nonzero, _FP_WORK_STICKY is or-ed into R_f[0], preceded by
   _FP_WORK_ROUND when X > S.  */
#define _FP_SQRT_MEAT_4(R, S, T, X, q)					\
Packit 6c4009
  do									\
Packit 6c4009
    {									\
Packit 6c4009
      while (q)								\
Packit 6c4009
	{								\
Packit 6c4009
	  T##_f[3] = S##_f[3] + (q);					\
Packit 6c4009
	  if (T##_f[3] <= X##_f[3])					\
Packit 6c4009
	    {								\
Packit 6c4009
	      S##_f[3] = T##_f[3] + (q);				\
Packit 6c4009
	      X##_f[3] -= T##_f[3];					\
Packit 6c4009
	      R##_f[3] += (q);						\
Packit 6c4009
	    }								\
Packit 6c4009
	  _FP_FRAC_SLL_4 (X, 1);					\
Packit 6c4009
	  (q) >>= 1;							\
Packit 6c4009
	}								\
Packit 6c4009
      (q) = (_FP_W_TYPE) 1 << (_FP_W_TYPE_SIZE - 1);			\
Packit 6c4009
      while (q)								\
Packit 6c4009
	{								\
Packit 6c4009
	  T##_f[2] = S##_f[2] + (q);					\
Packit 6c4009
	  T##_f[3] = S##_f[3];						\
Packit 6c4009
	  if (T##_f[3] < X##_f[3]					\
Packit 6c4009
	      || (T##_f[3] == X##_f[3] && T##_f[2] <= X##_f[2]))	\
Packit 6c4009
	    {								\
Packit 6c4009
	      S##_f[2] = T##_f[2] + (q);				\
Packit 6c4009
	      S##_f[3] += (T##_f[2] > S##_f[2]);			\
Packit 6c4009
	      __FP_FRAC_DEC_2 (X##_f[3], X##_f[2],			\
Packit 6c4009
			       T##_f[3], T##_f[2]);			\
Packit 6c4009
	      R##_f[2] += (q);						\
Packit 6c4009
	    }								\
Packit 6c4009
	  _FP_FRAC_SLL_4 (X, 1);					\
Packit 6c4009
	  (q) >>= 1;							\
Packit 6c4009
	}								\
Packit 6c4009
      (q) = (_FP_W_TYPE) 1 << (_FP_W_TYPE_SIZE - 1);			\
Packit 6c4009
      while (q)								\
Packit 6c4009
	{								\
Packit 6c4009
	  T##_f[1] = S##_f[1] + (q);					\
Packit 6c4009
	  T##_f[2] = S##_f[2];						\
Packit 6c4009
	  T##_f[3] = S##_f[3];						\
Packit 6c4009
	  if (T##_f[3] < X##_f[3]					\
Packit 6c4009
	      || (T##_f[3] == X##_f[3]					\
Packit 6c4009
		  && (T##_f[2] < X##_f[2]				\
Packit 6c4009
		      || (T##_f[2] == X##_f[2]				\
Packit 6c4009
			  && T##_f[1] <= X##_f[1]))))			\
Packit 6c4009
	    {								\
Packit 6c4009
	      S##_f[1] = T##_f[1] + (q);				\
Packit 6c4009
	      S##_f[2] += (T##_f[1] > S##_f[1]);			\
Packit 6c4009
	      S##_f[3] += (T##_f[2] > S##_f[2]);			\
Packit 6c4009
	      __FP_FRAC_DEC_3 (X##_f[3], X##_f[2], X##_f[1],		\
Packit 6c4009
			       T##_f[3], T##_f[2], T##_f[1]);		\
Packit 6c4009
	      R##_f[1] += (q);						\
Packit 6c4009
	    }								\
Packit 6c4009
	  _FP_FRAC_SLL_4 (X, 1);					\
Packit 6c4009
	  (q) >>= 1;							\
Packit 6c4009
	}								\
Packit 6c4009
      (q) = (_FP_W_TYPE) 1 << (_FP_W_TYPE_SIZE - 1);			\
Packit 6c4009
      while ((q) != _FP_WORK_ROUND)					\
Packit 6c4009
	{								\
Packit 6c4009
	  T##_f[0] = S##_f[0] + (q);					\
Packit 6c4009
	  T##_f[1] = S##_f[1];						\
Packit 6c4009
	  T##_f[2] = S##_f[2];						\
Packit 6c4009
	  T##_f[3] = S##_f[3];						\
Packit 6c4009
	  if (_FP_FRAC_GE_4 (X, T))					\
Packit 6c4009
	    {								\
Packit 6c4009
	      S##_f[0] = T##_f[0] + (q);				\
Packit 6c4009
	      S##_f[1] += (T##_f[0] > S##_f[0]);			\
Packit 6c4009
	      S##_f[2] += (T##_f[1] > S##_f[1]);			\
Packit 6c4009
	      S##_f[3] += (T##_f[2] > S##_f[2]);			\
Packit 6c4009
	      _FP_FRAC_DEC_4 (X, T);					\
Packit 6c4009
	      R##_f[0] += (q);						\
Packit 6c4009
	    }								\
Packit 6c4009
	  _FP_FRAC_SLL_4 (X, 1);					\
Packit 6c4009
	  (q) >>= 1;							\
Packit 6c4009
	}								\
Packit 6c4009
      if (!_FP_FRAC_ZEROP_4 (X))					\
Packit 6c4009
	{								\
Packit 6c4009
	  if (_FP_FRAC_GT_4 (X, S))					\
Packit 6c4009
	    R##_f[0] |= _FP_WORK_ROUND;					\
Packit 6c4009
	  R##_f[0] |= _FP_WORK_STICKY;					\
Packit 6c4009
	}								\
Packit 6c4009
    }									\
Packit 6c4009
  while (0)
Packit 6c4009
Packit 6c4009
Packit 6c4009
/* Internals.  */
Packit 6c4009
Packit 6c4009
/* Store four words into X's fraction array: I3 goes to X##_f[3] (the
   highest-indexed word) down to I0 in X##_f[0].  The stores happen in
   that order and the whole macro is a single comma expression.  */
#define __FP_FRAC_SET_4(X, I3, I2, I1, I0)	\
  (X##_f[3] = (I3),				\
   X##_f[2] = (I2),				\
   X##_f[1] = (I1),				\
   X##_f[0] = (I0))
Packit 6c4009
Packit 6c4009
/* Three-word addition: (r2, r1, r0) = (x2, x1, x0) + (y2, y1, y0), with
   word 0 the least significant.  The carry out of word 2 is dropped.
   The carry tests reread x0 and x1 after r0 and r1 have been written, so
   the result words must not be the same lvalues as the x operands.  */
#ifndef __FP_FRAC_ADD_3
# define __FP_FRAC_ADD_3(r2, r1, r0, x2, x1, x0, y2, y1, y0)		\
  do									\
    {									\
      _FP_W_TYPE __FP_FRAC_ADD_3_carry_lo;				\
      _FP_W_TYPE __FP_FRAC_ADD_3_carry_mid;				\
      /* Word 0: the sum wrapped iff it is smaller than an addend.  */	\
      r0 = x0 + y0;							\
      __FP_FRAC_ADD_3_carry_lo = (r0 < x0);				\
      /* Word 1: either the raw sum or the carry-in may wrap.  */	\
      r1 = x1 + y1;							\
      __FP_FRAC_ADD_3_carry_mid = (r1 < x1);				\
      r1 += __FP_FRAC_ADD_3_carry_lo;					\
      __FP_FRAC_ADD_3_carry_mid |= (r1 < __FP_FRAC_ADD_3_carry_lo);	\
      /* Word 2: absorb the carry; overflow here is discarded.  */	\
      r2 = x2 + y2 + __FP_FRAC_ADD_3_carry_mid;				\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* Four-word addition: (r3, r2, r1, r0) = (x3, x2, x1, x0) + (y3, y2, y1, y0),
   with word 0 the least significant.  The carry out of word 3 is dropped.
   The carry tests reread x0, x1 and x2 after the matching result word has
   been written, so the result words must not be the same lvalues as the
   x operands.  */
#ifndef __FP_FRAC_ADD_4
# define __FP_FRAC_ADD_4(r3, r2, r1, r0, x3, x2, x1, x0, y3, y2, y1, y0) \
  do									\
    {									\
      _FP_W_TYPE __FP_FRAC_ADD_4_carry0;				\
      _FP_W_TYPE __FP_FRAC_ADD_4_carry1;				\
      _FP_W_TYPE __FP_FRAC_ADD_4_carry2;				\
      /* Word 0: the sum wrapped iff it is smaller than an addend.  */	\
      r0 = x0 + y0;							\
      __FP_FRAC_ADD_4_carry0 = (r0 < x0);				\
      /* Word 1: either the raw sum or the carry-in may wrap.  */	\
      r1 = x1 + y1;							\
      __FP_FRAC_ADD_4_carry1 = (r1 < x1);				\
      r1 += __FP_FRAC_ADD_4_carry0;					\
      __FP_FRAC_ADD_4_carry1 |= (r1 < __FP_FRAC_ADD_4_carry0);		\
      /* Word 2: same two-step carry detection.  */			\
      r2 = x2 + y2;							\
      __FP_FRAC_ADD_4_carry2 = (r2 < x2);				\
      r2 += __FP_FRAC_ADD_4_carry1;					\
      __FP_FRAC_ADD_4_carry2 |= (r2 < __FP_FRAC_ADD_4_carry1);		\
      /* Word 3: absorb the carry; overflow here is discarded.  */	\
      r3 = x3 + y3 + __FP_FRAC_ADD_4_carry2;				\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* Three-word subtraction: (r2, r1, r0) = (x2, x1, x0) - (y2, y1, y0), with
   word 0 the least significant.  A borrow out of word 2 is dropped.
   The borrow tests reread x0, x1 and y1 after r0 and r1 have been
   written, so the result words must not be the same lvalues as those
   operands.  */
#ifndef __FP_FRAC_SUB_3
# define __FP_FRAC_SUB_3(r2, r1, r0, x2, x1, x0, y2, y1, y0)		\
  do									\
    {									\
      _FP_W_TYPE __FP_FRAC_SUB_3_borrow_lo;				\
      _FP_W_TYPE __FP_FRAC_SUB_3_borrow_mid;				\
      /* Word 0: wrapped iff the difference exceeds the minuend.  */	\
      r0 = x0 - y0;							\
      __FP_FRAC_SUB_3_borrow_lo = (r0 > x0);				\
      /* Word 1: borrow if x1 < y1, or if the incoming borrow	\
	 hits a zero difference (x1 == y1).  */				\
      r1 = x1 - y1;							\
      __FP_FRAC_SUB_3_borrow_mid = (r1 > x1);				\
      r1 -= __FP_FRAC_SUB_3_borrow_lo;					\
      __FP_FRAC_SUB_3_borrow_mid					\
	|= (__FP_FRAC_SUB_3_borrow_lo && (y1 == x1));			\
      /* Word 2: absorb the borrow; underflow here is discarded.  */	\
      r2 = x2 - y2 - __FP_FRAC_SUB_3_borrow_mid;			\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* Four-word subtraction: (r3, r2, r1, r0) = (x3, x2, x1, x0)
   - (y3, y2, y1, y0), with word 0 the least significant.  A borrow out
   of word 3 is dropped.  The borrow tests reread x0, x1, y1, x2 and y2
   after the matching result word has been written, so the result words
   must not be the same lvalues as those operands.  */
#ifndef __FP_FRAC_SUB_4
# define __FP_FRAC_SUB_4(r3, r2, r1, r0, x3, x2, x1, x0, y3, y2, y1, y0) \
  do									\
    {									\
      _FP_W_TYPE __FP_FRAC_SUB_4_borrow0;				\
      _FP_W_TYPE __FP_FRAC_SUB_4_borrow1;				\
      _FP_W_TYPE __FP_FRAC_SUB_4_borrow2;				\
      /* Word 0: wrapped iff the difference exceeds the minuend.  */	\
      r0 = x0 - y0;							\
      __FP_FRAC_SUB_4_borrow0 = (r0 > x0);				\
      /* Word 1: borrow if x1 < y1, or if the incoming borrow	\
	 hits a zero difference (x1 == y1).  */				\
      r1 = x1 - y1;							\
      __FP_FRAC_SUB_4_borrow1 = (r1 > x1);				\
      r1 -= __FP_FRAC_SUB_4_borrow0;					\
      __FP_FRAC_SUB_4_borrow1						\
	|= (__FP_FRAC_SUB_4_borrow0 && (y1 == x1));			\
      /* Word 2: same two-step borrow detection.  */			\
      r2 = x2 - y2;							\
      __FP_FRAC_SUB_4_borrow2 = (r2 > x2);				\
      r2 -= __FP_FRAC_SUB_4_borrow1;					\
      __FP_FRAC_SUB_4_borrow2						\
	|= (__FP_FRAC_SUB_4_borrow1 && (y2 == x2));			\
      /* Word 3: absorb the borrow; underflow here is discarded.  */	\
      r3 = x3 - y3 - __FP_FRAC_SUB_4_borrow2;				\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* In-place three-word decrement: (x2, x1, x0) -= (y2, y1, y0).
   The current value of x is first copied into temporaries, and those
   copies are handed to __FP_FRAC_SUB_3 as the minuend, so the words it
   reads are distinct from the x words it writes.  */
#ifndef __FP_FRAC_DEC_3
# define __FP_FRAC_DEC_3(x2, x1, x0, y2, y1, y0)			\
  do									\
    {									\
      UWtype __FP_FRAC_DEC_3_old0 = x0;					\
      UWtype __FP_FRAC_DEC_3_old1 = x1;					\
      UWtype __FP_FRAC_DEC_3_old2 = x2;					\
      __FP_FRAC_SUB_3 (x2, x1, x0,					\
		       __FP_FRAC_DEC_3_old2,				\
		       __FP_FRAC_DEC_3_old1,				\
		       __FP_FRAC_DEC_3_old0,				\
		       y2, y1, y0);					\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* In-place four-word decrement: (x3, x2, x1, x0) -= (y3, y2, y1, y0).
   The current value of x is first copied into temporaries, and those
   copies are handed to __FP_FRAC_SUB_4 as the minuend, so the words it
   reads are distinct from the x words it writes.  */
#ifndef __FP_FRAC_DEC_4
# define __FP_FRAC_DEC_4(x3, x2, x1, x0, y3, y2, y1, y0)		\
  do									\
    {									\
      UWtype __FP_FRAC_DEC_4_old0 = x0;					\
      UWtype __FP_FRAC_DEC_4_old1 = x1;					\
      UWtype __FP_FRAC_DEC_4_old2 = x2;					\
      UWtype __FP_FRAC_DEC_4_old3 = x3;					\
      __FP_FRAC_SUB_4 (x3, x2, x1, x0,					\
		       __FP_FRAC_DEC_4_old3,				\
		       __FP_FRAC_DEC_4_old2,				\
		       __FP_FRAC_DEC_4_old1,				\
		       __FP_FRAC_DEC_4_old0,				\
		       y3, y2, y1, y0);					\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* Add the single-word value I to the four-word number (x3, x2, x1, x0) in
   place, word 0 being the least significant, rippling the carry upwards.
   The carry out of x3 is dropped.

   I is evaluated exactly once and captured in a local, so an argument
   containing low-precedence operators (e.g. `a | b') or side effects
   behaves as a caller would expect.  */
#ifndef __FP_FRAC_ADDI_4
# define __FP_FRAC_ADDI_4(x3, x2, x1, x0, i)				\
  do									\
    {									\
      UWtype __FP_FRAC_ADDI_4_i = (i);					\
      UWtype __FP_FRAC_ADDI_4_t;					\
      /* Word 0 wrapped iff the new value is below the addend.  */	\
      __FP_FRAC_ADDI_4_t						\
	= ((x0 += __FP_FRAC_ADDI_4_i) < __FP_FRAC_ADDI_4_i);		\
      /* Each higher word wraps only if it was all-ones and the	\
	 carry-in was 1, i.e. it is now 0 < carry-in.  */		\
      x1 += __FP_FRAC_ADDI_4_t;						\
      __FP_FRAC_ADDI_4_t = (x1 < __FP_FRAC_ADDI_4_t);			\
      x2 += __FP_FRAC_ADDI_4_t;						\
      __FP_FRAC_ADDI_4_t = (x2 < __FP_FRAC_ADDI_4_t);			\
      x3 += __FP_FRAC_ADDI_4_t;						\
    }									\
  while (0)
#endif
Packit 6c4009
Packit 6c4009
/* Convert FP values between word sizes. This appears to be more
Packit 6c4009
   complicated than I'd have expected it to be, so these might be
Packit 6c4009
   wrong... These macros are in any case somewhat bogus because they
Packit 6c4009
   use information about what various FRAC_n variables look like
Packit 6c4009
   internally [eg, that 2 word vars are X_f0 and X_f1]. But so do
Packit 6c4009
   the ones in op-2.h and op-1.h.  */
Packit 6c4009
/* Narrow the four-word fraction S into the one-word fraction D by taking
   S##_f[0]; the other three words of S are not read.  */
#define _FP_FRAC_COPY_1_4(D, S)	\
  (D##_f = S##_f[0])
Packit 6c4009
Packit 6c4009
/* Narrow the four-word fraction S into the two-word fraction D:
   S##_f[1] goes to D##_f1 and S##_f[0] to D##_f0.  S##_f[2] and
   S##_f[3] are not read.  */
#define _FP_FRAC_COPY_2_4(D, S)		\
  do					\
    {					\
      D##_f1 = S##_f[1];		\
      D##_f0 = S##_f[0];		\
    }					\
  while (0)
Packit 6c4009
Packit 6c4009
/* Assembly/disassembly for converting to/from integral types.
Packit 6c4009
   No shifting or overflow handled here.  */
Packit 6c4009
/* Build the integer r, which is rsize bits wide, from the words of X.
   X##_f[0] supplies the low-order bits.  One word is used when rsize
   fits in a word, two when it fits in two words, and all four
   otherwise.  */
#define _FP_FRAC_ASSEMBLE_4(r, X, rsize)				\
  do									\
    {									\
      if ((rsize) <= _FP_W_TYPE_SIZE)					\
	{								\
	  (r) = X##_f[0];						\
	}								\
      else if ((rsize) <= 2 * _FP_W_TYPE_SIZE)				\
	{								\
	  /* The width test below is always true on this path.	\
	     Presumably it is kept so that the shift stays guarded	\
	     when this branch is compiled for a one-word r; confirm	\
	     before simplifying.  */					\
	  (r) = X##_f[1];						\
	  (r) = ((rsize) > _FP_W_TYPE_SIZE				\
		 ? (r) << _FP_W_TYPE_SIZE				\
		 : 0);							\
	  (r) += X##_f[0];						\
	}								\
      else								\
	{								\
	  /* Three-word (implausible) and four-word integers share	\
	     this path: start from the top word and shift each	\
	     lower word in beneath it.  */				\
	  (r) = X##_f[3];						\
	  (r) = ((rsize) > _FP_W_TYPE_SIZE				\
		 ? (r) << _FP_W_TYPE_SIZE				\
		 : 0);							\
	  (r) += X##_f[2];						\
	  (r) = ((rsize) > _FP_W_TYPE_SIZE				\
		 ? (r) << _FP_W_TYPE_SIZE				\
		 : 0);							\
	  (r) += X##_f[1];						\
	  (r) = ((rsize) > _FP_W_TYPE_SIZE				\
		 ? (r) << _FP_W_TYPE_SIZE				\
		 : 0);							\
	  (r) += X##_f[0];						\
	}								\
    }									\
  while (0)
Packit 6c4009
Packit 6c4009
/* "No disassemble Number Five!" */
Packit 6c4009
/* Spread the integer r, which is rsize bits wide, across X's fraction
   words, low-order bits into X##_f[0].  A word that lies wholly beyond
   rsize bits is set to zero.  No masking is done: each store relies on
   the _f[] elements being exactly _FP_W_TYPE_SIZE bits wide, so that the
   assignment itself drops the higher bits.  */
#define _FP_FRAC_DISASSEMBLE_4(X, r, rsize)		\
  do							\
    {							\
      X##_f[0] = (r);					\
      X##_f[1] = ((rsize) > _FP_W_TYPE_SIZE		\
		  ? (r) >> _FP_W_TYPE_SIZE		\
		  : 0);					\
      X##_f[2] = ((rsize) > 2 * _FP_W_TYPE_SIZE		\
		  ? (r) >> 2 * _FP_W_TYPE_SIZE		\
		  : 0);					\
      X##_f[3] = ((rsize) > 3 * _FP_W_TYPE_SIZE		\
		  ? (r) >> 3 * _FP_W_TYPE_SIZE		\
		  : 0);					\
    }							\
  while (0)
Packit 6c4009
Packit 6c4009
/* Widen the one-word fraction S into the four-word fraction D:
   S##_f lands in D##_f[0] and the three upper words are cleared.  */
#define _FP_FRAC_COPY_4_1(D, S)		\
  do					\
    {					\
      D##_f[0] = S##_f;			\
      D##_f[3] = 0;			\
      D##_f[2] = 0;			\
      D##_f[1] = 0;			\
    }					\
  while (0)
Packit 6c4009
Packit 6c4009
/* Widen the two-word fraction S into the four-word fraction D:
   S##_f0 and S##_f1 land in D##_f[0] and D##_f[1], and the two upper
   words are cleared.  */
#define _FP_FRAC_COPY_4_2(D, S)		\
  do					\
    {					\
      D##_f[0] = S##_f0;		\
      D##_f[1] = S##_f1;		\
      D##_f[3] = 0;			\
      D##_f[2] = 0;			\
    }					\
  while (0)
Packit 6c4009
Packit 6c4009
/* Four-word to four-word copy: forwards unchanged to _FP_FRAC_COPY_4.  */
#define _FP_FRAC_COPY_4_4(D, S)	_FP_FRAC_COPY_4 (D, S)
Packit 6c4009
Packit 6c4009
#endif /* !SOFT_FP_OP_4_H */