[mirror_ubuntu-jammy-kernel.git] / arch / ppc / math-emu / op-common.h

#define _FP_DECL(wc, X)			\
  _FP_I_TYPE X##_c, X##_s, X##_e;	\
  _FP_FRAC_DECL_##wc(X)

/*
 * Finish truely unpacking a native fp value by classifying the kind
 * of fp value and normalizing both the exponent and the fraction.
 */

#define _FP_UNPACK_CANONICAL(fs, wc, X)					\
do {									\
  switch (X##_e)							\
  {									\
  default:								\
    _FP_FRAC_HIGH_##wc(X) |= _FP_IMPLBIT_##fs;				\
    _FP_FRAC_SLL_##wc(X, _FP_WORKBITS);					\
    X##_e -= _FP_EXPBIAS_##fs;						\
    X##_c = FP_CLS_NORMAL;						\
    break;								\
									\
  case 0:								\
    if (_FP_FRAC_ZEROP_##wc(X))						\
      X##_c = FP_CLS_ZERO;						\
    else								\
      {									\
	/* a denormalized number */					\
	_FP_I_TYPE _shift;						\
	_FP_FRAC_CLZ_##wc(_shift, X);					\
	_shift -= _FP_FRACXBITS_##fs;					\
	_FP_FRAC_SLL_##wc(X, (_shift+_FP_WORKBITS));			\
	X##_e -= _FP_EXPBIAS_##fs - 1 + _shift;				\
	X##_c = FP_CLS_NORMAL;						\
      }									\
    break;								\
									\
  case _FP_EXPMAX_##fs:							\
    if (_FP_FRAC_ZEROP_##wc(X))						\
      X##_c = FP_CLS_INF;						\
    else								\
      /* we don't differentiate between signaling and quiet nans */	\
      X##_c = FP_CLS_NAN;						\
    break;								\
  }									\
} while (0)


/*
 * Before packing the bits back into the native fp result, take care
 * of such mundane things as rounding and overflow.  Also, for some
 * kinds of fp values, the original parts may not have been fully
 * extracted -- but that is ok, we can regenerate them now.
 */

#define _FP_PACK_CANONICAL(fs, wc, X)				\
({int __ret = 0;						\
  switch (X##_c)						\
  {								\
  case FP_CLS_NORMAL:						\
    X##_e += _FP_EXPBIAS_##fs;					\
    if (X##_e > 0)						\
      {								\
	__ret |= _FP_ROUND(wc, X);				\
	if (_FP_FRAC_OVERP_##wc(fs, X))				\
	  {							\
	    _FP_FRAC_SRL_##wc(X, (_FP_WORKBITS+1));		\
	    X##_e++;						\
	  }							\
	else							\
	  _FP_FRAC_SRL_##wc(X, _FP_WORKBITS);			\
	if (X##_e >= _FP_EXPMAX_##fs)				\
	  {							\
	    /* overflow to infinity */				\
	    X##_e = _FP_EXPMAX_##fs;				\
	    _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);		\
            __ret |= EFLAG_OVERFLOW;				\
	  }							\
      }								\
    else							\
      {								\
	/* we've got a denormalized number */			\
	X##_e = -X##_e + 1;					\
	if (X##_e <= _FP_WFRACBITS_##fs)			\
	  {							\
	    _FP_FRAC_SRS_##wc(X, X##_e, _FP_WFRACBITS_##fs);	\
	    _FP_FRAC_SLL_##wc(X, 1);				\
	    if (_FP_FRAC_OVERP_##wc(fs, X))			\
	      {							\
	        X##_e = 1;					\
	        _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);	\
	      }							\
	    else						\
	      {							\
		X##_e = 0;					\
		_FP_FRAC_SRL_##wc(X, _FP_WORKBITS+1);		\
                __ret |= EFLAG_UNDERFLOW;			\
	      }							\
	  }							\
	else							\
	  {							\
	    /* underflow to zero */				\
	    X##_e = 0;						\
	    _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);		\
            __ret |= EFLAG_UNDERFLOW;				\
	  }							\
      }								\
    break;							\
								\
  case FP_CLS_ZERO:						\
    X##_e = 0;							\
    _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);			\
    break;							\
								\
  case FP_CLS_INF:						\
    X##_e = _FP_EXPMAX_##fs;					\
    _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);			\
    break;							\
								\
  case FP_CLS_NAN:						\
    X##_e = _FP_EXPMAX_##fs;					\
    if (!_FP_KEEPNANFRACP)					\
      {								\
	_FP_FRAC_SET_##wc(X, _FP_NANFRAC_##fs);			\
	X##_s = 0;						\
      }								\
    else							\
      _FP_FRAC_HIGH_##wc(X) |= _FP_QNANBIT_##fs;		\
    break;							\
  }								\
  __ret;							\
})


/*
 * Main addition routine.  The input values should be cooked.
 */

#define _FP_ADD(fs, wc, R, X, Y)					     \
do {									     \
  switch (_FP_CLS_COMBINE(X##_c, Y##_c))				     \
  {									     \
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL):			     \
    {									     \
      /* shift the smaller number so that its exponent matches the larger */ \
      _FP_I_TYPE diff = X##_e - Y##_e;					     \
									     \
      if (diff < 0)							     \
	{								     \
	  diff = -diff;							     \
	  if (diff <= _FP_WFRACBITS_##fs)				     \
	    _FP_FRAC_SRS_##wc(X, diff, _FP_WFRACBITS_##fs);		     \
	  else if (!_FP_FRAC_ZEROP_##wc(X))				     \
	    _FP_FRAC_SET_##wc(X, _FP_MINFRAC_##wc);			     \
	  else								     \
	    _FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);			     \
	  R##_e = Y##_e;						     \
	}								     \
      else								     \
	{								     \
	  if (diff > 0)							     \
	    {								     \
	      if (diff <= _FP_WFRACBITS_##fs)				     \
	        _FP_FRAC_SRS_##wc(Y, diff, _FP_WFRACBITS_##fs);		     \
	      else if (!_FP_FRAC_ZEROP_##wc(Y))				     \
	        _FP_FRAC_SET_##wc(Y, _FP_MINFRAC_##wc);			     \
	      else							     \
	        _FP_FRAC_SET_##wc(Y, _FP_ZEROFRAC_##wc);		     \
	    }								     \
	  R##_e = X##_e;						     \
	}								     \
									     \
      R##_c = FP_CLS_NORMAL;						     \
									     \
      if (X##_s == Y##_s)						     \
	{								     \
	  R##_s = X##_s;						     \
	  _FP_FRAC_ADD_##wc(R, X, Y);					     \
	  if (_FP_FRAC_OVERP_##wc(fs, R))				     \
	    {								     \
	      _FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs);		     \
	      R##_e++;							     \
	    }								     \
	}								     \
      else								     \
	{								     \
	  R##_s = X##_s;						     \
	  _FP_FRAC_SUB_##wc(R, X, Y);					     \
	  if (_FP_FRAC_ZEROP_##wc(R))					     \
	    {								     \
	      /* return an exact zero */				     \
	      if (FP_ROUNDMODE == FP_RND_MINF)				     \
		R##_s |= Y##_s;						     \
	      else							     \
		R##_s &= Y##_s;						     \
	      R##_c = FP_CLS_ZERO;					     \
	    }								     \
	  else								     \
	    {								     \
	      if (_FP_FRAC_NEGP_##wc(R))				     \
		{							     \
		  _FP_FRAC_SUB_##wc(R, Y, X);				     \
		  R##_s = Y##_s;					     \
		}							     \
									     \
	      /* renormalize after subtraction */			     \
	      _FP_FRAC_CLZ_##wc(diff, R);				     \
	      diff -= _FP_WFRACXBITS_##fs;				     \
	      if (diff)							     \
		{							     \
		  R##_e -= diff;					     \
		  _FP_FRAC_SLL_##wc(R, diff);				     \
		}							     \
	    }								     \
	}								     \
      break;								     \
    }									     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN):				     \
    _FP_CHOOSENAN(fs, wc, R, X, Y);					     \
    break;								     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO):			     \
    R##_e = X##_e;							     \
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL):			     \
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF):				     \
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO):				     \
    _FP_FRAC_COPY_##wc(R, X);						     \
    R##_s = X##_s;							     \
    R##_c = X##_c;							     \
    break;								     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL):			     \
    R##_e = Y##_e;							     \
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN):			     \
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN):				     \
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN):				     \
    _FP_FRAC_COPY_##wc(R, Y);						     \
    R##_s = Y##_s;							     \
    R##_c = Y##_c;							     \
    break;								     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF):				     \
    if (X##_s != Y##_s)							     \
      {									     \
	/* +INF + -INF => NAN */					     \
	_FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs);				     \
	R##_s = X##_s ^ Y##_s;						     \
	R##_c = FP_CLS_NAN;						     \
	break;								     \
      }									     \
    /* FALLTHRU */							     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL):			     \
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO):				     \
    R##_s = X##_s;							     \
    R##_c = FP_CLS_INF;							     \
    break;								     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF):			     \
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF):				     \
    R##_s = Y##_s;							     \
    R##_c = FP_CLS_INF;							     \
    break;								     \
									     \
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO):			     \
    /* make sure the sign is correct */					     \
    if (FP_ROUNDMODE == FP_RND_MINF)					     \
      R##_s = X##_s | Y##_s;						     \
    else								     \
      R##_s = X##_s & Y##_s;						     \
    R##_c = FP_CLS_ZERO;						     \
    break;								     \
									     \
  default:								     \
    abort();								     \
  }									     \
} while (0)


/*
 * Main negation routine.  FIXME -- when we care about setting exception
 * bits reliably, this will not do.  We should examine all of the fp classes.
 */

#define _FP_NEG(fs, wc, R, X)		\
  do {					\
    _FP_FRAC_COPY_##wc(R, X);		\
    R##_c = X##_c;			\
    R##_e = X##_e;			\
    R##_s = 1 ^ X##_s;			\
  } while (0)


/*
 * Main multiplication routine.  The input values should be cooked.
 */

#define _FP_MUL(fs, wc, R, X, Y)			\
do {							\
  R##_s = X##_s ^ Y##_s;				\
  switch (_FP_CLS_COMBINE(X##_c, Y##_c))		\
  {							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL):	\
    R##_c = FP_CLS_NORMAL;				\
    R##_e = X##_e + Y##_e + 1;				\
							\
    _FP_MUL_MEAT_##fs(R,X,Y);				\
							\
    if (_FP_FRAC_OVERP_##wc(fs, R))			\
      _FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs);	\
    else						\
      R##_e--;						\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN):		\
    _FP_CHOOSENAN(fs, wc, R, X, Y);			\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL):	\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF):		\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO):		\
    R##_s = X##_s;					\
							\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF):		\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL):	\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL):	\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO):	\
    _FP_FRAC_COPY_##wc(R, X);				\
    R##_c = X##_c;					\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN):	\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN):		\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN):		\
    R##_s = Y##_s;					\
							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF):	\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO):	\
    _FP_FRAC_COPY_##wc(R, Y);				\
    R##_c = Y##_c;					\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO):		\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF):		\
    R##_c = FP_CLS_NAN;					\
    _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs);		\
    break;						\
							\
  default:						\
    abort();						\
  }							\
} while (0)


/*
 * Main division routine.  The input values should be cooked.
 */

#define _FP_DIV(fs, wc, R, X, Y)			\
do {							\
  R##_s = X##_s ^ Y##_s;				\
  switch (_FP_CLS_COMBINE(X##_c, Y##_c))		\
  {							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL):	\
    R##_c = FP_CLS_NORMAL;				\
    R##_e = X##_e - Y##_e;				\
							\
    _FP_DIV_MEAT_##fs(R,X,Y);				\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN):		\
    _FP_CHOOSENAN(fs, wc, R, X, Y);			\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL):	\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF):		\
  case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO):		\
    R##_s = X##_s;					\
    _FP_FRAC_COPY_##wc(R, X);				\
    R##_c = X##_c;					\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN):	\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN):		\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN):		\
    R##_s = Y##_s;					\
    _FP_FRAC_COPY_##wc(R, Y);				\
    R##_c = Y##_c;					\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF):	\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF):		\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL):	\
    R##_c = FP_CLS_ZERO;				\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO):	\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO):		\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL):	\
    R##_c = FP_CLS_INF;					\
    break;						\
							\
  case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF):		\
  case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO):	\
    R##_c = FP_CLS_NAN;					\
    _FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs);		\
    break;						\
							\
  default:						\
    abort();						\
  }							\
} while (0)


/*
 * Main differential comparison routine.  The inputs should be raw not
 * cooked.  The return is -1,0,1 for normal values, 2 otherwise.
 */

#define _FP_CMP(fs, wc, ret, X, Y, un)					\
  do {									\
    /* NANs are unordered */						\
    if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X))		\
	|| (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y)))	\
      {									\
	ret = un;							\
      }									\
    else								\
      {									\
        int __x_zero = (!X##_e && _FP_FRAC_ZEROP_##wc(X)) ? 1 : 0;	\
        int __y_zero = (!Y##_e && _FP_FRAC_ZEROP_##wc(Y)) ? 1 : 0;	\
									\
	if (__x_zero && __y_zero)					\
	  ret = 0;							\
	else if (__x_zero)						\
	  ret = Y##_s ? 1 : -1;						\
	else if (__y_zero)						\
	  ret = X##_s ? -1 : 1;						\
	else if (X##_s != Y##_s)					\
	  ret = X##_s ? -1 : 1;						\
	else if (X##_e > Y##_e)						\
	  ret = X##_s ? -1 : 1;						\
	else if (X##_e < Y##_e)						\
	  ret = X##_s ? 1 : -1;						\
	else if (_FP_FRAC_GT_##wc(X, Y))				\
	  ret = X##_s ? -1 : 1;						\
	else if (_FP_FRAC_GT_##wc(Y, X))				\
	  ret = X##_s ? 1 : -1;						\
	else								\
	  ret = 0;							\
      }									\
  } while (0)


/* Simplification for strict equality.  */

#define _FP_CMP_EQ(fs, wc, ret, X, Y)					  \
  do {									  \
    /* NANs are unordered */						  \
    if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X))		  \
	|| (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y)))	  \
      {									  \
	ret = 1;							  \
      }									  \
    else								  \
      {									  \
	ret = !(X##_e == Y##_e						  \
		&& _FP_FRAC_EQ_##wc(X, Y)				  \
		&& (X##_s == Y##_s || !X##_e && _FP_FRAC_ZEROP_##wc(X))); \
      }									  \
  } while (0)

/*
 * Main square root routine.  The input value should be cooked.
 */

#define _FP_SQRT(fs, wc, R, X)						\
do {									\
    _FP_FRAC_DECL_##wc(T); _FP_FRAC_DECL_##wc(S);			\
    _FP_W_TYPE q;							\
    switch (X##_c)							\
    {									\
    case FP_CLS_NAN:							\
    	R##_s = 0;							\
    	R##_c = FP_CLS_NAN;						\
    	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc);			\
    	break;								\
    case FP_CLS_INF:							\
    	if (X##_s)							\
    	  {								\
    	    R##_s = 0;							\
	    R##_c = FP_CLS_NAN; /* sNAN */				\
    	  }								\
    	else								\
    	  {								\
    	    R##_s = 0;							\
    	    R##_c = FP_CLS_INF; /* sqrt(+inf) = +inf */			\
    	  }								\
    	break;								\
    case FP_CLS_ZERO:							\
	R##_s = X##_s;							\
    	R##_c = FP_CLS_ZERO; /* sqrt(+-0) = +-0 */			\
	break;								\
    case FP_CLS_NORMAL:							\
    	R##_s = 0;							\
        if (X##_s)							\
          {								\
	    R##_c = FP_CLS_NAN; /* sNAN */				\
	    break;							\
          }								\
    	R##_c = FP_CLS_NORMAL;						\
        if (X##_e & 1)							\
          _FP_FRAC_SLL_##wc(X, 1);					\
        R##_e = X##_e >> 1;						\
        _FP_FRAC_SET_##wc(S, _FP_ZEROFRAC_##wc);			\
        _FP_FRAC_SET_##wc(R, _FP_ZEROFRAC_##wc);			\
        q = _FP_OVERFLOW_##fs;						\
        _FP_FRAC_SLL_##wc(X, 1);					\
        _FP_SQRT_MEAT_##wc(R, S, T, X, q);				\
        _FP_FRAC_SRL_##wc(R, 1);					\
    }									\
  } while (0)

/*
 * Convert from FP to integer
 */

/* "When a NaN, infinity, large positive argument >= 2147483648.0, or
 * large negative argument <= -2147483649.0 is converted to an integer,
 * the invalid_current bit...should be set and fp_exception_IEEE_754 should
 * be raised. If the floating point invalid trap is disabled, no trap occurs
 * and a numerical result is generated: if the sign bit of the operand
 * is 0, the result is 2147483647; if the sign bit of the operand is 1,
 * the result is -2147483648."
 * Similarly for conversion to extended ints, except that the boundaries
 * are >= 2^63, <= -(2^63 + 1), and the results are 2^63 + 1 for s=0 and
 * -2^63 for s=1.
 * -- SPARC Architecture Manual V9, Appendix B, which specifies how
 * SPARCs resolve implementation dependencies in the IEEE-754 spec.
 * I don't believe that the code below follows this. I'm not even sure
 * it's right!
 * It doesn't cope with needing to convert to an n bit integer when there
 * is no n bit integer type. Fortunately gcc provides long long so this
 * isn't a problem for sparc32.
 * I have, however, fixed its NaN handling to conform as above.
 *         -- PMM 02/1998
 * NB: rsigned is not 'is r declared signed?' but 'should the value stored
 * in r be signed or unsigned?'. r is always(?) declared unsigned.
 * Comments below are mine, BTW -- PMM
 */
#define _FP_TO_INT(fs, wc, r, X, rsize, rsigned)			\
  do {									\
    switch (X##_c)							\
      {									\
      case FP_CLS_NORMAL:						\
	if (X##_e < 0)							\
	  {								\
	  /* case FP_CLS_NAN: see above! */				\
	  case FP_CLS_ZERO:						\
	    r = 0;							\
	  }								\
	else if (X##_e >= rsize - (rsigned != 0))			\
	  {	/* overflow */						\
	  case FP_CLS_NAN:                                              \
          case FP_CLS_INF:						\
	    if (rsigned)						\
	      {								\
		r = 1;							\
		r <<= rsize - 1;					\
		r -= 1 - X##_s;						\
	      }								\
	    else							\
	      {								\
		r = 0;							\
		if (!X##_s)						\
		  r = ~r;						\
	      }								\
	  }								\
	else								\
	  {								\
	    if (_FP_W_TYPE_SIZE*wc < rsize)				\
	      {								\
		_FP_FRAC_ASSEMBLE_##wc(r, X, rsize);			\
		r <<= X##_e - _FP_WFRACBITS_##fs;			\
	      }								\
	    else							\
	      {								\
		if (X##_e >= _FP_WFRACBITS_##fs)			\
		  _FP_FRAC_SLL_##wc(X, (X##_e - _FP_WFRACBITS_##fs + 1));\
		else							\
		  _FP_FRAC_SRL_##wc(X, (_FP_WFRACBITS_##fs - X##_e - 1));\
		_FP_FRAC_ASSEMBLE_##wc(r, X, rsize);			\
	      }								\
	    if (rsigned && X##_s)					\
	      r = -r;							\
	  }								\
	break;								\
      }									\
  } while (0)

#define _FP_FROM_INT(fs, wc, X, r, rsize, rtype)			\
  do {									\
    if (r)								\
      {									\
	X##_c = FP_CLS_NORMAL;						\
									\
	if ((X##_s = (r < 0)))						\
	  r = -r;							\
	/* Note that `r' is now considered unsigned, so we don't have	\
	   to worry about the single signed overflow case.  */		\
									\
	if (rsize <= _FP_W_TYPE_SIZE)					\
	  __FP_CLZ(X##_e, r);						\
	else								\
	  __FP_CLZ_2(X##_e, (_FP_W_TYPE)(r >> _FP_W_TYPE_SIZE), 	\
		     (_FP_W_TYPE)r);					\
	if (rsize < _FP_W_TYPE_SIZE)					\
		X##_e -= (_FP_W_TYPE_SIZE - rsize);			\
	X##_e = rsize - X##_e - 1;					\
									\
	if (_FP_FRACBITS_##fs < rsize && _FP_WFRACBITS_##fs < X##_e)	\
	  __FP_FRAC_SRS_1(r, (X##_e - _FP_WFRACBITS_##fs), rsize);	\
	r &= ~((_FP_W_TYPE)1 << X##_e);					\
	_FP_FRAC_DISASSEMBLE_##wc(X, ((unsigned rtype)r), rsize);	\
	_FP_FRAC_SLL_##wc(X, (_FP_WFRACBITS_##fs - X##_e - 1));		\
      }									\
    else								\
      {									\
	X##_c = FP_CLS_ZERO, X##_s = 0;					\
      }									\
  } while (0)


#define FP_CONV(dfs,sfs,dwc,swc,D,S)			\
  do {							\
    _FP_FRAC_CONV_##dwc##_##swc(dfs, sfs, D, S);	\
    D##_e = S##_e;					\
    D##_c = S##_c;					\
    D##_s = S##_s;					\
  } while (0)

/*
 * Helper primitives.
 */

/* Count leading zeros in a word.  */

#ifndef __FP_CLZ
#if _FP_W_TYPE_SIZE < 64
/* this is just to shut the compiler up about shifts > word length -- PMM 02/1998 */
#define __FP_CLZ(r, x)				\
  do {						\
    _FP_W_TYPE _t = (x);			\
    r = _FP_W_TYPE_SIZE - 1;			\
    if (_t > 0xffff) r -= 16;			\
    if (_t > 0xffff) _t >>= 16;			\
    if (_t > 0xff) r -= 8;			\
    if (_t > 0xff) _t >>= 8;			\
    if (_t & 0xf0) r -= 4;			\
    if (_t & 0xf0) _t >>= 4;			\
    if (_t & 0xc) r -= 2;			\
    if (_t & 0xc) _t >>= 2;			\
    if (_t & 0x2) r -= 1;			\
  } while (0)
#else /* not _FP_W_TYPE_SIZE < 64 */
#define __FP_CLZ(r, x)				\
  do {						\
    _FP_W_TYPE _t = (x);			\
    r = _FP_W_TYPE_SIZE - 1;			\
    if (_t > 0xffffffff) r -= 32;		\
    if (_t > 0xffffffff) _t >>= 32;		\
    if (_t > 0xffff) r -= 16;			\
    if (_t > 0xffff) _t >>= 16;			\
    if (_t > 0xff) r -= 8;			\
    if (_t > 0xff) _t >>= 8;			\
    if (_t & 0xf0) r -= 4;			\
    if (_t & 0xf0) _t >>= 4;			\
    if (_t & 0xc) r -= 2;			\
    if (_t & 0xc) _t >>= 2;			\
    if (_t & 0x2) r -= 1;			\
  } while (0)
#endif /* not _FP_W_TYPE_SIZE < 64 */
#endif /* ndef __FP_CLZ */

#define _FP_DIV_HELP_imm(q, r, n, d)		\
  do {						\
    q = n / d, r = n % d;			\
  } while (0)
Commit	Line	Data
1da177e4 LT	1	#define _FP_DECL(wc, X) \
	2	_FP_I_TYPE X##_c, X##_s, X##_e; \
	3	_FP_FRAC_DECL_##wc(X)
	4
	5	/*
	6	* Finish truely unpacking a native fp value by classifying the kind
	7	* of fp value and normalizing both the exponent and the fraction.
	8	*/
	9
	10	#define _FP_UNPACK_CANONICAL(fs, wc, X) \
	11	do { \
	12	switch (X##_e) \
	13	{ \
	14	default: \
	15	_FP_FRAC_HIGH_##wc(X) \|= _FP_IMPLBIT_##fs; \
	16	_FP_FRAC_SLL_##wc(X, _FP_WORKBITS); \
	17	X##_e -= _FP_EXPBIAS_##fs; \
	18	X##_c = FP_CLS_NORMAL; \
	19	break; \
	20	\
	21	case 0: \
	22	if (_FP_FRAC_ZEROP_##wc(X)) \
	23	X##_c = FP_CLS_ZERO; \
	24	else \
	25	{ \
	26	/* a denormalized number */ \
	27	_FP_I_TYPE _shift; \
	28	_FP_FRAC_CLZ_##wc(_shift, X); \
	29	_shift -= _FP_FRACXBITS_##fs; \
	30	_FP_FRAC_SLL_##wc(X, (_shift+_FP_WORKBITS)); \
	31	X##_e -= _FP_EXPBIAS_##fs - 1 + _shift; \
	32	X##_c = FP_CLS_NORMAL; \
	33	} \
	34	break; \
	35	\
	36	case _FP_EXPMAX_##fs: \
	37	if (_FP_FRAC_ZEROP_##wc(X)) \
	38	X##_c = FP_CLS_INF; \
	39	else \
	40	/* we don't differentiate between signaling and quiet nans */ \
	41	X##_c = FP_CLS_NAN; \
	42	break; \
	43	} \
	44	} while (0)
	45
	46
	47	/*
	48	* Before packing the bits back into the native fp result, take care
	49	* of such mundane things as rounding and overflow. Also, for some
	50	* kinds of fp values, the original parts may not have been fully
	51	* extracted -- but that is ok, we can regenerate them now.
	52	*/
	53
	54	#define _FP_PACK_CANONICAL(fs, wc, X) \
	55	({int __ret = 0; \
	56	switch (X##_c) \
	57	{ \
	58	case FP_CLS_NORMAL: \
	59	X##_e += _FP_EXPBIAS_##fs; \
	60	if (X##_e > 0) \
	61	{ \
	62	__ret \|= _FP_ROUND(wc, X); \
	63	if (_FP_FRAC_OVERP_##wc(fs, X)) \
	64	{ \
65	_FP_FRAC_SRL_##wc(X, (_FP_WORKBITS+1)); \
66	X##_e++; \
67	} \
68	else \
69	_FP_FRAC_SRL_##wc(X, _FP_WORKBITS); \
70	if (X##_e >= _FP_EXPMAX_##fs) \
71	{ \
72	/* overflow to infinity */ \
73	X##_e = _FP_EXPMAX_##fs; \
74	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
75	__ret \|= EFLAG_OVERFLOW; \
76	} \
77	} \
78	else \
79	{ \
80	/* we've got a denormalized number */ \
81	X##_e = -X##_e + 1; \
82	if (X##_e <= _FP_WFRACBITS_##fs) \
83	{ \
84	_FP_FRAC_SRS_##wc(X, X##_e, _FP_WFRACBITS_##fs); \
85	_FP_FRAC_SLL_##wc(X, 1); \
86	if (_FP_FRAC_OVERP_##wc(fs, X)) \
87	{ \
88	X##_e = 1; \
89	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
90	} \
91	else \
92	{ \
93	X##_e = 0; \
94	_FP_FRAC_SRL_##wc(X, _FP_WORKBITS+1); \
95	__ret \|= EFLAG_UNDERFLOW; \
96	} \
97	} \
98	else \
99	{ \
100	/* underflow to zero */ \
101	X##_e = 0; \
102	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
103	__ret \|= EFLAG_UNDERFLOW; \
104	} \
105	} \
106	break; \
107	\
108	case FP_CLS_ZERO: \
109	X##_e = 0; \
110	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
111	break; \
112	\
113	case FP_CLS_INF: \
114	X##_e = _FP_EXPMAX_##fs; \
115	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
116	break; \
117	\
118	case FP_CLS_NAN: \
119	X##_e = _FP_EXPMAX_##fs; \
120	if (!_FP_KEEPNANFRACP) \
121	{ \
122	_FP_FRAC_SET_##wc(X, _FP_NANFRAC_##fs); \
123	X##_s = 0; \
124	} \
125	else \
126	_FP_FRAC_HIGH_##wc(X) \|= _FP_QNANBIT_##fs; \
127	break; \
128	} \
129	__ret; \
130	})
131
132
133	/*
134	* Main addition routine. The input values should be cooked.
135	*/
136
137	#define _FP_ADD(fs, wc, R, X, Y) \
138	do { \
139	switch (_FP_CLS_COMBINE(X##_c, Y##_c)) \
140	{ \
141	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL): \
142	{ \
143	/* shift the smaller number so that its exponent matches the larger */ \
144	_FP_I_TYPE diff = X##_e - Y##_e; \
145	\
146	if (diff < 0) \
147	{ \
148	diff = -diff; \
149	if (diff <= _FP_WFRACBITS_##fs) \
150	_FP_FRAC_SRS_##wc(X, diff, _FP_WFRACBITS_##fs); \
151	else if (!_FP_FRAC_ZEROP_##wc(X)) \
152	_FP_FRAC_SET_##wc(X, _FP_MINFRAC_##wc); \
153	else \
154	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
155	R##_e = Y##_e; \
156	} \
157	else \
158	{ \
159	if (diff > 0) \
160	{ \
161	if (diff <= _FP_WFRACBITS_##fs) \
162	_FP_FRAC_SRS_##wc(Y, diff, _FP_WFRACBITS_##fs); \
163	else if (!_FP_FRAC_ZEROP_##wc(Y)) \
164	_FP_FRAC_SET_##wc(Y, _FP_MINFRAC_##wc); \
165	else \
166	_FP_FRAC_SET_##wc(Y, _FP_ZEROFRAC_##wc); \
167	} \
168	R##_e = X##_e; \
169	} \
170	\
171	R##_c = FP_CLS_NORMAL; \
172	\
173	if (X##_s == Y##_s) \
174	{ \
175	R##_s = X##_s; \
176	_FP_FRAC_ADD_##wc(R, X, Y); \
177	if (_FP_FRAC_OVERP_##wc(fs, R)) \
178	{ \
179	_FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs); \
180	R##_e++; \
181	} \
182	} \
183	else \
184	{ \
185	R##_s = X##_s; \
186	_FP_FRAC_SUB_##wc(R, X, Y); \
187	if (_FP_FRAC_ZEROP_##wc(R)) \
188	{ \
189	/* return an exact zero */ \
190	if (FP_ROUNDMODE == FP_RND_MINF) \
191	R##_s \|= Y##_s; \
192	else \
193	R##_s &= Y##_s; \
194	R##_c = FP_CLS_ZERO; \
195	} \
196	else \
197	{ \
198	if (_FP_FRAC_NEGP_##wc(R)) \
199	{ \
200	_FP_FRAC_SUB_##wc(R, Y, X); \
201	R##_s = Y##_s; \
202	} \
203	\
204	/* renormalize after subtraction */ \
205	_FP_FRAC_CLZ_##wc(diff, R); \
206	diff -= _FP_WFRACXBITS_##fs; \
207	if (diff) \
208	{ \
209	R##_e -= diff; \
210	_FP_FRAC_SLL_##wc(R, diff); \
211	} \
212	} \
213	} \
214	break; \
215	} \
216	\
217	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN): \
218	_FP_CHOOSENAN(fs, wc, R, X, Y); \
219	break; \
220	\
221	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO): \
222	R##_e = X##_e; \
223	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL): \
224	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF): \
225	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO): \
226	_FP_FRAC_COPY_##wc(R, X); \
227	R##_s = X##_s; \
228	R##_c = X##_c; \
229	break; \
230	\
231	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL): \
232	R##_e = Y##_e; \
233	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN): \
234	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN): \
235	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN): \
236	_FP_FRAC_COPY_##wc(R, Y); \
237	R##_s = Y##_s; \
238	R##_c = Y##_c; \
239	break; \
240	\
241	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF): \
242	if (X##_s != Y##_s) \
243	{ \
244	/* +INF + -INF => NAN */ \
245	_FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
246	R##_s = X##_s ^ Y##_s; \
247	R##_c = FP_CLS_NAN; \
248	break; \
249	} \
250	/* FALLTHRU */ \
251	\
252	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL): \
253	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO): \
254	R##_s = X##_s; \
255	R##_c = FP_CLS_INF; \
256	break; \
257	\
258	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF): \
259	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF): \
260	R##_s = Y##_s; \
261	R##_c = FP_CLS_INF; \
262	break; \
263	\
264	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO): \
265	/* make sure the sign is correct */ \
266	if (FP_ROUNDMODE == FP_RND_MINF) \
267	R##_s = X##_s \| Y##_s; \
268	else \
269	R##_s = X##_s & Y##_s; \
270	R##_c = FP_CLS_ZERO; \
271	break; \
272	\
273	default: \
274	abort(); \
275	} \
276	} while (0)
277
278
279	/*
280	* Main negation routine. FIXME -- when we care about setting exception
281	* bits reliably, this will not do. We should examine all of the fp classes.
282	*/
283
284	#define _FP_NEG(fs, wc, R, X) \
285	do { \
286	_FP_FRAC_COPY_##wc(R, X); \
287	R##_c = X##_c; \
288	R##_e = X##_e; \
289	R##_s = 1 ^ X##_s; \
290	} while (0)
291
292
293	/*
294	* Main multiplication routine. The input values should be cooked.
295	*/
296
297	#define _FP_MUL(fs, wc, R, X, Y) \
298	do { \
299	R##_s = X##_s ^ Y##_s; \
300	switch (_FP_CLS_COMBINE(X##_c, Y##_c)) \
301	{ \
302	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL): \
303	R##_c = FP_CLS_NORMAL; \
304	R##_e = X##_e + Y##_e + 1; \
305	\
306	_FP_MUL_MEAT_##fs(R,X,Y); \
307	\
308	if (_FP_FRAC_OVERP_##wc(fs, R)) \
309	_FP_FRAC_SRS_##wc(R, 1, _FP_WFRACBITS_##fs); \
310	else \
311	R##_e--; \
312	break; \
313	\
314	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN): \
315	_FP_CHOOSENAN(fs, wc, R, X, Y); \
316	break; \
317	\
318	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL): \
319	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF): \
320	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO): \
321	R##_s = X##_s; \
322	\
323	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF): \
324	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL): \
325	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL): \
326	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO): \
327	_FP_FRAC_COPY_##wc(R, X); \
328	R##_c = X##_c; \
329	break; \
330	\
331	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN): \
332	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN): \
333	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN): \
334	R##_s = Y##_s; \
335	\
336	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF): \
337	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO): \
338	_FP_FRAC_COPY_##wc(R, Y); \
339	R##_c = Y##_c; \
340	break; \
341	\
342	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO): \
343	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF): \
344	R##_c = FP_CLS_NAN; \
345	_FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
346	break; \
347	\
348	default: \
349	abort(); \
350	} \
351	} while (0)
352
353
354	/*
355	* Main division routine. The input values should be cooked.
356	*/
357
358	#define _FP_DIV(fs, wc, R, X, Y) \
359	do { \
360	R##_s = X##_s ^ Y##_s; \
361	switch (_FP_CLS_COMBINE(X##_c, Y##_c)) \
362	{ \
363	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NORMAL): \
364	R##_c = FP_CLS_NORMAL; \
365	R##_e = X##_e - Y##_e; \
366	\
367	_FP_DIV_MEAT_##fs(R,X,Y); \
368	break; \
369	\
370	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NAN): \
371	_FP_CHOOSENAN(fs, wc, R, X, Y); \
372	break; \
373	\
374	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_NORMAL): \
375	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_INF): \
376	case _FP_CLS_COMBINE(FP_CLS_NAN,FP_CLS_ZERO): \
377	R##_s = X##_s; \
378	_FP_FRAC_COPY_##wc(R, X); \
379	R##_c = X##_c; \
380	break; \
381	\
382	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_NAN): \
383	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NAN): \
384	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NAN): \
385	R##_s = Y##_s; \
386	_FP_FRAC_COPY_##wc(R, Y); \
387	R##_c = Y##_c; \
388	break; \
389	\
390	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_INF): \
391	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_INF): \
392	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_NORMAL): \
393	R##_c = FP_CLS_ZERO; \
394	break; \
395	\
396	case _FP_CLS_COMBINE(FP_CLS_NORMAL,FP_CLS_ZERO): \
397	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_ZERO): \
398	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_NORMAL): \
399	R##_c = FP_CLS_INF; \
400	break; \
401	\
402	case _FP_CLS_COMBINE(FP_CLS_INF,FP_CLS_INF): \
403	case _FP_CLS_COMBINE(FP_CLS_ZERO,FP_CLS_ZERO): \
404	R##_c = FP_CLS_NAN; \
405	_FP_FRAC_SET_##wc(R, _FP_NANFRAC_##fs); \
406	break; \
407	\
408	default: \
409	abort(); \
410	} \
411	} while (0)
412
413
414	/*
415	* Main differential comparison routine. The inputs should be raw not
416	* cooked. The return is -1,0,1 for normal values, 2 otherwise.
417	*/
418
419	#define _FP_CMP(fs, wc, ret, X, Y, un) \
420	do { \
421	/* NANs are unordered */ \
422	if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X)) \
423	\|\| (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))) \
424	{ \
425	ret = un; \
426	} \
427	else \
428	{ \
429	int __x_zero = (!X##_e && _FP_FRAC_ZEROP_##wc(X)) ? 1 : 0; \
430	int __y_zero = (!Y##_e && _FP_FRAC_ZEROP_##wc(Y)) ? 1 : 0; \
431	\
432	if (__x_zero && __y_zero) \
433	ret = 0; \
434	else if (__x_zero) \
435	ret = Y##_s ? 1 : -1; \
436	else if (__y_zero) \
437	ret = X##_s ? -1 : 1; \
438	else if (X##_s != Y##_s) \
439	ret = X##_s ? -1 : 1; \
440	else if (X##_e > Y##_e) \
441	ret = X##_s ? -1 : 1; \
442	else if (X##_e < Y##_e) \
443	ret = X##_s ? 1 : -1; \
444	else if (_FP_FRAC_GT_##wc(X, Y)) \
445	ret = X##_s ? -1 : 1; \
446	else if (_FP_FRAC_GT_##wc(Y, X)) \
447	ret = X##_s ? 1 : -1; \
448	else \
449	ret = 0; \
450	} \
451	} while (0)
452
453
454	/* Simplification for strict equality. */
455
456	#define _FP_CMP_EQ(fs, wc, ret, X, Y) \
457	do { \
458	/* NANs are unordered */ \
459	if ((X##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(X)) \
460	\|\| (Y##_e == _FP_EXPMAX_##fs && !_FP_FRAC_ZEROP_##wc(Y))) \
461	{ \
462	ret = 1; \
463	} \
464	else \
465	{ \
466	ret = !(X##_e == Y##_e \
467	&& _FP_FRAC_EQ_##wc(X, Y) \
468	&& (X##_s == Y##_s \|\| !X##_e && _FP_FRAC_ZEROP_##wc(X))); \
469	} \
470	} while (0)
471
472	/*
473	* Main square root routine. The input value should be cooked.
474	*/
475
476	#define _FP_SQRT(fs, wc, R, X) \
477	do { \
478	_FP_FRAC_DECL_##wc(T); _FP_FRAC_DECL_##wc(S); \
479	_FP_W_TYPE q; \
480	switch (X##_c) \
481	{ \
482	case FP_CLS_NAN: \
483	R##_s = 0; \
484	R##_c = FP_CLS_NAN; \
485	_FP_FRAC_SET_##wc(X, _FP_ZEROFRAC_##wc); \
486	break; \
487	case FP_CLS_INF: \
488	if (X##_s) \
489	{ \
490	R##_s = 0; \
491	R##_c = FP_CLS_NAN; /* sNAN */ \
492	} \
493	else \
494	{ \
495	R##_s = 0; \
496	R##_c = FP_CLS_INF; /* sqrt(+inf) = +inf */ \
497	} \
498	break; \
499	case FP_CLS_ZERO: \
500	R##_s = X##_s; \
501	R##_c = FP_CLS_ZERO; /* sqrt(+-0) = +-0 */ \
502	break; \
503	case FP_CLS_NORMAL: \
504	R##_s = 0; \
505	if (X##_s) \
506	{ \
507	R##_c = FP_CLS_NAN; /* sNAN */ \
508	break; \
509	} \
510	R##_c = FP_CLS_NORMAL; \
511	if (X##_e & 1) \
512	_FP_FRAC_SLL_##wc(X, 1); \
513	R##_e = X##_e >> 1; \
514	_FP_FRAC_SET_##wc(S, _FP_ZEROFRAC_##wc); \
515	_FP_FRAC_SET_##wc(R, _FP_ZEROFRAC_##wc); \
516	q = _FP_OVERFLOW_##fs; \
517	_FP_FRAC_SLL_##wc(X, 1); \
518	_FP_SQRT_MEAT_##wc(R, S, T, X, q); \
519	_FP_FRAC_SRL_##wc(R, 1); \
520	} \
521	} while (0)
522
523	/*
524	* Convert from FP to integer
525	*/
526
527	/* "When a NaN, infinity, large positive argument >= 2147483648.0, or
528	* large negative argument <= -2147483649.0 is converted to an integer,
529	* the invalid_current bit...should be set and fp_exception_IEEE_754 should
530	* be raised. If the floating point invalid trap is disabled, no trap occurs
531	* and a numerical result is generated: if the sign bit of the operand
532	* is 0, the result is 2147483647; if the sign bit of the operand is 1,
533	* the result is -2147483648."
534	* Similarly for conversion to extended ints, except that the boundaries
535	* are >= 2^63, <= -(2^63 + 1), and the results are 2^63 + 1 for s=0 and
536	* -2^63 for s=1.
537	* -- SPARC Architecture Manual V9, Appendix B, which specifies how
538	* SPARCs resolve implementation dependencies in the IEEE-754 spec.
539	* I don't believe that the code below follows this. I'm not even sure
540	* it's right!
541	* It doesn't cope with needing to convert to an n bit integer when there
542	* is no n bit integer type. Fortunately gcc provides long long so this
543	* isn't a problem for sparc32.
544	* I have, however, fixed its NaN handling to conform as above.
545	* -- PMM 02/1998
546	* NB: rsigned is not 'is r declared signed?' but 'should the value stored
547	* in r be signed or unsigned?'. r is always(?) declared unsigned.
548	* Comments below are mine, BTW -- PMM
549	*/
550	#define _FP_TO_INT(fs, wc, r, X, rsize, rsigned) \
551	do { \
552	switch (X##_c) \
553	{ \
554	case FP_CLS_NORMAL: \
555	if (X##_e < 0) \
556	{ \
557	/* case FP_CLS_NAN: see above! */ \
558	case FP_CLS_ZERO: \
559	r = 0; \
560	} \
561	else if (X##_e >= rsize - (rsigned != 0)) \
562	{ /* overflow */ \
563	case FP_CLS_NAN: \
564	case FP_CLS_INF: \
565	if (rsigned) \
566	{ \
567	r = 1; \
568	r <<= rsize - 1; \
569	r -= 1 - X##_s; \
570	} \
571	else \
572	{ \
573	r = 0; \
574	if (!X##_s) \
575	r = ~r; \
576	} \
577	} \
578	else \
579	{ \
580	if (_FP_W_TYPE_SIZE*wc < rsize) \
581	{ \
582	_FP_FRAC_ASSEMBLE_##wc(r, X, rsize); \
583	r <<= X##_e - _FP_WFRACBITS_##fs; \
584	} \
585	else \
586	{ \
587	if (X##_e >= _FP_WFRACBITS_##fs) \
588	_FP_FRAC_SLL_##wc(X, (X##_e - _FP_WFRACBITS_##fs + 1));\
589	else \
590	_FP_FRAC_SRL_##wc(X, (_FP_WFRACBITS_##fs - X##_e - 1));\
591	_FP_FRAC_ASSEMBLE_##wc(r, X, rsize); \
592	} \
593	if (rsigned && X##_s) \
594	r = -r; \
595	} \
596	break; \
597	} \
598	} while (0)
599
600	#define _FP_FROM_INT(fs, wc, X, r, rsize, rtype) \
601	do { \
602	if (r) \
603	{ \
604	X##_c = FP_CLS_NORMAL; \
605	\
606	if ((X##_s = (r < 0))) \
607	r = -r; \
608	/* Note that `r' is now considered unsigned, so we don't have \
609	to worry about the single signed overflow case. */ \
610	\
611	if (rsize <= _FP_W_TYPE_SIZE) \
612	__FP_CLZ(X##_e, r); \
613	else \
614	__FP_CLZ_2(X##_e, (_FP_W_TYPE)(r >> _FP_W_TYPE_SIZE), \
615	(_FP_W_TYPE)r); \
616	if (rsize < _FP_W_TYPE_SIZE) \
617	X##_e -= (_FP_W_TYPE_SIZE - rsize); \
618	X##_e = rsize - X##_e - 1; \
619	\
620	if (_FP_FRACBITS_##fs < rsize && _FP_WFRACBITS_##fs < X##_e) \
621	__FP_FRAC_SRS_1(r, (X##_e - _FP_WFRACBITS_##fs), rsize); \
622	r &= ~((_FP_W_TYPE)1 << X##_e); \
623	_FP_FRAC_DISASSEMBLE_##wc(X, ((unsigned rtype)r), rsize); \
624	_FP_FRAC_SLL_##wc(X, (_FP_WFRACBITS_##fs - X##_e - 1)); \
625	} \
626	else \
627	{ \
628	X##_c = FP_CLS_ZERO, X##_s = 0; \
629	} \
630	} while (0)
631
632
633	#define FP_CONV(dfs,sfs,dwc,swc,D,S) \
634	do { \
635	_FP_FRAC_CONV_##dwc##_##swc(dfs, sfs, D, S); \
636	D##_e = S##_e; \
637	D##_c = S##_c; \
638	D##_s = S##_s; \
639	} while (0)
640
641	/*
642	* Helper primitives.
643	*/
644
645	/* Count leading zeros in a word. */
646
647	#ifndef __FP_CLZ
648	#if _FP_W_TYPE_SIZE < 64
649	/* this is just to shut the compiler up about shifts > word length -- PMM 02/1998 */
650	#define __FP_CLZ(r, x) \
651	do { \
652	_FP_W_TYPE _t = (x); \
653	r = _FP_W_TYPE_SIZE - 1; \
654	if (_t > 0xffff) r -= 16; \
655	if (_t > 0xffff) _t >>= 16; \
656	if (_t > 0xff) r -= 8; \
657	if (_t > 0xff) _t >>= 8; \
658	if (_t & 0xf0) r -= 4; \
659	if (_t & 0xf0) _t >>= 4; \
660	if (_t & 0xc) r -= 2; \
661	if (_t & 0xc) _t >>= 2; \
662	if (_t & 0x2) r -= 1; \
663	} while (0)
664	#else /* not _FP_W_TYPE_SIZE < 64 */
665	#define __FP_CLZ(r, x) \
666	do { \
667	_FP_W_TYPE _t = (x); \
668	r = _FP_W_TYPE_SIZE - 1; \
669	if (_t > 0xffffffff) r -= 32; \
670	if (_t > 0xffffffff) _t >>= 32; \
671	if (_t > 0xffff) r -= 16; \
672	if (_t > 0xffff) _t >>= 16; \
673	if (_t > 0xff) r -= 8; \
674	if (_t > 0xff) _t >>= 8; \
675	if (_t & 0xf0) r -= 4; \
676	if (_t & 0xf0) _t >>= 4; \
677	if (_t & 0xc) r -= 2; \
678	if (_t & 0xc) _t >>= 2; \
679	if (_t & 0x2) r -= 1; \
680	} while (0)
681	#endif /* not _FP_W_TYPE_SIZE < 64 */
682	#endif /* ndef __FP_CLZ */
683
684	#define _FP_DIV_HELP_imm(q, r, n, d) \
685	do { \
686	q = n / d, r = n % d; \
687	} while (0)
688