]> git.proxmox.com Git - mirror_qemu.git/blame - fpu/softfloat-parts.c.inc
softfloat: Use mulu64 for mul64To128
[mirror_qemu.git] / fpu / softfloat-parts.c.inc
CommitLineData
7c45bad8
RH
1/*
2 * QEMU float support
3 *
4 * The code in this source file is derived from release 2a of the SoftFloat
5 * IEC/IEEE Floating-point Arithmetic Package. Those parts of the code (and
6 * some later contributions) are provided under that license, as detailed below.
7 * It has subsequently been modified by contributors to the QEMU Project,
8 * so some portions are provided under:
9 * the SoftFloat-2a license
10 * the BSD license
11 * GPL-v2-or-later
12 *
13 * Any future contributions to this file after December 1st 2014 will be
14 * taken to be licensed under the Softfloat-2a license unless specifically
15 * indicated otherwise.
16 */
17
18static void partsN(return_nan)(FloatPartsN *a, float_status *s)
19{
20 switch (a->cls) {
21 case float_class_snan:
22 float_raise(float_flag_invalid, s);
23 if (s->default_nan_mode) {
24 parts_default_nan(a, s);
25 } else {
26 parts_silence_nan(a, s);
27 }
28 break;
29 case float_class_qnan:
30 if (s->default_nan_mode) {
31 parts_default_nan(a, s);
32 }
33 break;
34 default:
35 g_assert_not_reached();
36 }
37}
22c355f4
RH
38
39static FloatPartsN *partsN(pick_nan)(FloatPartsN *a, FloatPartsN *b,
40 float_status *s)
41{
42 if (is_snan(a->cls) || is_snan(b->cls)) {
43 float_raise(float_flag_invalid, s);
44 }
45
46 if (s->default_nan_mode) {
47 parts_default_nan(a, s);
48 } else {
49 int cmp = frac_cmp(a, b);
50 if (cmp == 0) {
51 cmp = a->sign < b->sign;
52 }
53
54 if (pickNaN(a->cls, b->cls, cmp > 0, s)) {
55 a = b;
56 }
57 if (is_snan(a->cls)) {
58 parts_silence_nan(a, s);
59 }
60 }
61 return a;
62}
979582d0
RH
63
64static FloatPartsN *partsN(pick_nan_muladd)(FloatPartsN *a, FloatPartsN *b,
65 FloatPartsN *c, float_status *s,
66 int ab_mask, int abc_mask)
67{
68 int which;
69
70 if (unlikely(abc_mask & float_cmask_snan)) {
71 float_raise(float_flag_invalid, s);
72 }
73
74 which = pickNaNMulAdd(a->cls, b->cls, c->cls,
75 ab_mask == float_cmask_infzero, s);
76
77 if (s->default_nan_mode || which == 3) {
78 /*
79 * Note that this check is after pickNaNMulAdd so that function
80 * has an opportunity to set the Invalid flag for infzero.
81 */
82 parts_default_nan(a, s);
83 return a;
84 }
85
86 switch (which) {
87 case 0:
88 break;
89 case 1:
90 a = b;
91 break;
92 case 2:
93 a = c;
94 break;
95 default:
96 g_assert_not_reached();
97 }
98 if (is_snan(a->cls)) {
99 parts_silence_nan(a, s);
100 }
101 return a;
102}
d46975bc
RH
103
/*
 * Canonicalize the FloatParts structure.  Determine the class,
 * unbias the exponent, and normalize the fraction.
 */
static void partsN(canonicalize)(FloatPartsN *p, float_status *status,
                                 const FloatFmt *fmt)
{
    if (unlikely(p->exp == 0)) {
        /* Biased exponent 0: either a true zero or a subnormal. */
        if (likely(frac_eqz(p))) {
            p->cls = float_class_zero;
        } else if (status->flush_inputs_to_zero) {
            /* Subnormal input flushed to zero per status setting. */
            float_raise(float_flag_input_denormal, status);
            p->cls = float_class_zero;
            frac_clear(p);
        } else {
            /*
             * Normalize the subnormal; the shift count returned by
             * frac_normalize feeds into the unbiased exponent.
             */
            int shift = frac_normalize(p);
            p->cls = float_class_normal;
            p->exp = fmt->frac_shift - fmt->exp_bias - shift + 1;
        }
    } else if (likely(p->exp < fmt->exp_max) || fmt->arm_althp) {
        /*
         * Normal number (ARM alternative half-precision has no
         * Inf/NaN encodings, so its top exponent is normal too).
         * Shift the fraction into decomposed position and make the
         * implicit integer bit explicit.
         */
        p->cls = float_class_normal;
        p->exp -= fmt->exp_bias;
        frac_shl(p, fmt->frac_shift);
        p->frac_hi |= DECOMPOSED_IMPLICIT_BIT;
    } else if (likely(frac_eqz(p))) {
        /* Maximum exponent with zero fraction: infinity. */
        p->cls = float_class_inf;
    } else {
        /* Maximum exponent, nonzero fraction: NaN; classify sNaN/qNaN. */
        frac_shl(p, fmt->frac_shift);
        p->cls = (parts_is_snan_frac(p->frac_hi, status)
                  ? float_class_snan : float_class_qnan);
    }
}
ee6959f2
RH
136
/*
 * Round and uncanonicalize a floating-point number by parts.  There
 * are FRAC_SHIFT bits that may require rounding at the bottom of the
 * fraction; these bits will be removed.  The exponent will be biased
 * by EXP_BIAS and must be bounded by [0, EXP_MAX-1].
 */
static void partsN(uncanon)(FloatPartsN *p, float_status *s,
                            const FloatFmt *fmt)
{
    const int exp_max = fmt->exp_max;
    const int frac_shift = fmt->frac_shift;
    const uint64_t frac_lsb = fmt->frac_lsb;
    const uint64_t frac_lsbm1 = fmt->frac_lsbm1;
    const uint64_t round_mask = fmt->round_mask;
    const uint64_t roundeven_mask = fmt->roundeven_mask;
    uint64_t inc;
    bool overflow_norm;
    int exp, flags = 0;

    /* Non-normal classes need no rounding; just set the encoding. */
    if (unlikely(p->cls != float_class_normal)) {
        switch (p->cls) {
        case float_class_zero:
            p->exp = 0;
            frac_clear(p);
            return;
        case float_class_inf:
            /* ARM Alt HP has no Inf encoding. */
            g_assert(!fmt->arm_althp);
            p->exp = fmt->exp_max;
            frac_clear(p);
            return;
        case float_class_qnan:
        case float_class_snan:
            /* ARM Alt HP has no NaN encoding. */
            g_assert(!fmt->arm_althp);
            p->exp = fmt->exp_max;
            frac_shr(p, fmt->frac_shift);
            return;
        default:
            break;
        }
        g_assert_not_reached();
    }

    /*
     * Choose the rounding increment INC for the bits below the lsb,
     * and whether overflow saturates to the maximum finite value
     * (overflow_norm) instead of producing infinity.
     */
    switch (s->float_rounding_mode) {
    case float_round_nearest_even:
        overflow_norm = false;
        /* Add half-ulp, except exactly halfway with even lsb (ties-to-even). */
        inc = ((p->frac_lo & roundeven_mask) != frac_lsbm1 ? frac_lsbm1 : 0);
        break;
    case float_round_ties_away:
        overflow_norm = false;
        inc = frac_lsbm1;
        break;
    case float_round_to_zero:
        overflow_norm = true;
        inc = 0;
        break;
    case float_round_up:
        inc = p->sign ? 0 : round_mask;
        overflow_norm = p->sign;
        break;
    case float_round_down:
        inc = p->sign ? round_mask : 0;
        overflow_norm = !p->sign;
        break;
    case float_round_to_odd:
        overflow_norm = true;
        /* Round so that the lsb becomes 1 if any discarded bit is set. */
        inc = p->frac_lo & frac_lsb ? 0 : round_mask;
        break;
    default:
        g_assert_not_reached();
    }

    exp = p->exp + fmt->exp_bias;
    if (likely(exp > 0)) {
        /* Normal (non-tiny) result: round, then check for overflow. */
        if (p->frac_lo & round_mask) {
            flags |= float_flag_inexact;
            if (frac_addi(p, p, inc)) {
                /* Rounding carried out of the fraction; renormalize. */
                frac_shr(p, 1);
                p->frac_hi |= DECOMPOSED_IMPLICIT_BIT;
                exp++;
            }
        }
        frac_shr(p, frac_shift);

        if (fmt->arm_althp) {
            /* ARM Alt HP eschews Inf and NaN for a wider exponent. */
            if (unlikely(exp > exp_max)) {
                /* Overflow.  Return the maximum normal.  */
                flags = float_flag_invalid;
                exp = exp_max;
                frac_allones(p);
            }
        } else if (unlikely(exp >= exp_max)) {
            flags |= float_flag_overflow | float_flag_inexact;
            if (overflow_norm) {
                /* Saturate to largest finite value. */
                exp = exp_max - 1;
                frac_allones(p);
            } else {
                p->cls = float_class_inf;
                exp = exp_max;
                frac_clear(p);
            }
        }
    } else if (s->flush_to_zero) {
        /* Tiny result flushed to zero per status setting. */
        flags |= float_flag_output_denormal;
        p->cls = float_class_zero;
        exp = 0;
        frac_clear(p);
    } else {
        /*
         * Subnormal result.  Tininess may be detected before or after
         * rounding; "after rounding" means tiny only if rounding does
         * not carry up into the smallest normal.
         */
        bool is_tiny = s->tininess_before_rounding || exp < 0;

        if (!is_tiny) {
            FloatPartsN discard;
            is_tiny = !frac_addi(&discard, p, inc);
        }

        /* Denormalize, jamming discarded bits into the sticky bit. */
        frac_shrjam(p, 1 - exp);

        if (p->frac_lo & round_mask) {
            /* Need to recompute round-to-even/round-to-odd. */
            switch (s->float_rounding_mode) {
            case float_round_nearest_even:
                inc = ((p->frac_lo & roundeven_mask) != frac_lsbm1
                       ? frac_lsbm1 : 0);
                break;
            case float_round_to_odd:
                inc = p->frac_lo & frac_lsb ? 0 : round_mask;
                break;
            default:
                break;
            }
            flags |= float_flag_inexact;
            frac_addi(p, p, inc);
        }

        /* Biased exponent is 1 iff rounding produced the smallest normal. */
        exp = (p->frac_hi & DECOMPOSED_IMPLICIT_BIT) != 0;
        frac_shr(p, frac_shift);

        if (is_tiny && (flags & float_flag_inexact)) {
            flags |= float_flag_underflow;
        }
        if (exp == 0 && frac_eqz(p)) {
            p->cls = float_class_zero;
        }
    }
    p->exp = exp;
    float_raise(flags, s);
}
da10a907
RH
284
/*
 * Returns the result of adding or subtracting the values of the
 * floating-point values `a' and `b'.  The operation is performed
 * according to the IEC/IEEE Standard for Binary Floating-Point
 * Arithmetic.
 */
static FloatPartsN *partsN(addsub)(FloatPartsN *a, FloatPartsN *b,
                                   float_status *s, bool subtract)
{
    /* Fold the subtract flag into B's sign: a - b == a + (-b). */
    bool b_sign = b->sign ^ subtract;
    int ab_mask = float_cmask(a->cls) | float_cmask(b->cls);

    if (a->sign != b_sign) {
        /* Subtraction */
        if (likely(ab_mask == float_cmask_normal)) {
            if (parts_sub_normal(a, b)) {
                return a;
            }
            /* Subtract was exact, fall through to set sign. */
            ab_mask = float_cmask_zero;
        }

        if (ab_mask == float_cmask_zero) {
            /*
             * An exact zero difference is -0 only when rounding down
             * (IEEE 754: x - x is +0 in all other rounding modes).
             */
            a->sign = s->float_rounding_mode == float_round_down;
            return a;
        }

        if (unlikely(ab_mask & float_cmask_anynan)) {
            goto p_nan;
        }

        if (ab_mask & float_cmask_inf) {
            if (a->cls != float_class_inf) {
                /* N - Inf */
                goto return_b;
            }
            if (b->cls != float_class_inf) {
                /* Inf - N */
                return a;
            }
            /* Inf - Inf */
            float_raise(float_flag_invalid, s);
            parts_default_nan(a, s);
            return a;
        }
    } else {
        /* Addition */
        if (likely(ab_mask == float_cmask_normal)) {
            parts_add_normal(a, b);
            return a;
        }

        if (ab_mask == float_cmask_zero) {
            return a;
        }

        if (unlikely(ab_mask & float_cmask_anynan)) {
            goto p_nan;
        }

        if (ab_mask & float_cmask_inf) {
            a->cls = float_class_inf;
            return a;
        }
    }

    /* Only zero +/- normal combinations remain. */
    if (b->cls == float_class_zero) {
        g_assert(a->cls == float_class_normal);
        return a;
    }

    g_assert(a->cls == float_class_zero);
    g_assert(b->cls == float_class_normal);
 return_b:
    /* Return B, with the effective (possibly negated) sign. */
    b->sign = b_sign;
    return b;

 p_nan:
    return parts_pick_nan(a, b, s);
}
aca84527
RH
365
366/*
367 * Returns the result of multiplying the floating-point values `a' and
368 * `b'. The operation is performed according to the IEC/IEEE Standard
369 * for Binary Floating-Point Arithmetic.
370 */
371static FloatPartsN *partsN(mul)(FloatPartsN *a, FloatPartsN *b,
372 float_status *s)
373{
374 int ab_mask = float_cmask(a->cls) | float_cmask(b->cls);
375 bool sign = a->sign ^ b->sign;
376
377 if (likely(ab_mask == float_cmask_normal)) {
378 FloatPartsW tmp;
379
380 frac_mulw(&tmp, a, b);
381 frac_truncjam(a, &tmp);
382
383 a->exp += b->exp + 1;
384 if (!(a->frac_hi & DECOMPOSED_IMPLICIT_BIT)) {
385 frac_add(a, a, a);
386 a->exp -= 1;
387 }
388
389 a->sign = sign;
390 return a;
391 }
392
393 /* Inf * Zero == NaN */
394 if (unlikely(ab_mask == float_cmask_infzero)) {
395 float_raise(float_flag_invalid, s);
396 parts_default_nan(a, s);
397 return a;
398 }
399
400 if (unlikely(ab_mask & float_cmask_anynan)) {
401 return parts_pick_nan(a, b, s);
402 }
403
404 /* Multiply by 0 or Inf */
405 if (ab_mask & float_cmask_inf) {
406 a->cls = float_class_inf;
407 a->sign = sign;
408 return a;
409 }
410
411 g_assert(ab_mask & float_cmask_zero);
412 a->cls = float_class_zero;
413 a->sign = sign;
414 return a;
415}
dedd123c
RH
416
/*
 * Returns the result of multiplying the floating-point values `a' and
 * `b' then adding 'c', with no intermediate rounding step after the
 * multiplication.  The operation is performed according to the
 * IEC/IEEE Standard for Binary Floating-Point Arithmetic 754-2008.
 * The flags argument allows the caller to select negation of the
 * addend, the intermediate product, or the final result.  (The
 * difference between this and having the caller do a separate
 * negation is that negating externally will flip the sign bit on NaNs.)
 *
 * Requires A and C extracted into a double-sized structure to provide the
 * extra space for the widening multiply.
 */
static FloatPartsN *partsN(muladd)(FloatPartsN *a, FloatPartsN *b,
                                   FloatPartsN *c, int flags, float_status *s)
{
    int ab_mask, abc_mask;
    FloatPartsW p_widen, c_widen;

    ab_mask = float_cmask(a->cls) | float_cmask(b->cls);
    abc_mask = float_cmask(c->cls) | ab_mask;

    /*
     * It is implementation-defined whether the cases of (0,inf,qnan)
     * and (inf,0,qnan) raise InvalidOperation or not (and what QNaN
     * they return if they do), so we have to hand this information
     * off to the target-specific pick-a-NaN routine.
     */
    if (unlikely(abc_mask & float_cmask_anynan)) {
        return parts_pick_nan_muladd(a, b, c, s, ab_mask, abc_mask);
    }

    if (flags & float_muladd_negate_c) {
        c->sign ^= 1;
    }

    /* Compute the sign of the product into A. */
    a->sign ^= b->sign;
    if (flags & float_muladd_negate_product) {
        a->sign ^= 1;
    }

    /* Handle Inf/Zero operands in the product without multiplying. */
    if (unlikely(ab_mask != float_cmask_normal)) {
        if (unlikely(ab_mask == float_cmask_infzero)) {
            /* Inf * 0 is invalid regardless of C. */
            goto d_nan;
        }

        if (ab_mask & float_cmask_inf) {
            /* Inf * N; invalid only if C is the oppositely-signed Inf. */
            if (c->cls == float_class_inf && a->sign != c->sign) {
                goto d_nan;
            }
            goto return_inf;
        }

        /* The product is zero: the result is determined by C alone. */
        g_assert(ab_mask & float_cmask_zero);
        if (c->cls == float_class_normal) {
            *a = *c;
            goto return_normal;
        }
        if (c->cls == float_class_zero) {
            if (a->sign != c->sign) {
                /* (+0) + (-0): sign depends on rounding mode. */
                goto return_sub_zero;
            }
            goto return_zero;
        }
        g_assert(c->cls == float_class_inf);
    }

    if (unlikely(c->cls == float_class_inf)) {
        /* N * N + Inf (same-signed Inf cases from above land here too). */
        a->sign = c->sign;
        goto return_inf;
    }

    /* Perform the multiplication step. */
    p_widen.sign = a->sign;
    /*
     * Product of fractions in [1, 2) is in [1, 4): bias the exponent
     * by one, then correct below if the implicit bit is not set.
     */
    p_widen.exp = a->exp + b->exp + 1;
    frac_mulw(&p_widen, a, b);
    if (!(p_widen.frac_hi & DECOMPOSED_IMPLICIT_BIT)) {
        frac_add(&p_widen, &p_widen, &p_widen);
        p_widen.exp -= 1;
    }

    /* Perform the addition step. */
    if (c->cls != float_class_zero) {
        /* Zero-extend C to less significant bits. */
        frac_widen(&c_widen, c);
        c_widen.exp = c->exp;

        if (a->sign == c->sign) {
            parts_add_normal(&p_widen, &c_widen);
        } else if (!parts_sub_normal(&p_widen, &c_widen)) {
            /* Exact cancellation: result is a signed zero. */
            goto return_sub_zero;
        }
    }

    /* Narrow with sticky bit, for proper rounding later. */
    frac_truncjam(a, &p_widen);
    a->sign = p_widen.sign;
    a->exp = p_widen.exp;

 return_normal:
    if (flags & float_muladd_halve_result) {
        a->exp -= 1;
    }
 finish_sign:
    if (flags & float_muladd_negate_result) {
        a->sign ^= 1;
    }
    return a;

 return_sub_zero:
    /* An exact zero sum is -0 only when rounding down (IEEE 754). */
    a->sign = s->float_rounding_mode == float_round_down;
 return_zero:
    a->cls = float_class_zero;
    goto finish_sign;

 return_inf:
    a->cls = float_class_inf;
    goto finish_sign;

 d_nan:
    float_raise(float_flag_invalid, s);
    parts_default_nan(a, s);
    return a;
}