src/util/softfloat.c

bf215546Sopenharmony_ci/*
bf215546Sopenharmony_ci * License for Berkeley SoftFloat Release 3e
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * John R. Hauser
bf215546Sopenharmony_ci * 2018 January 20
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * The following applies to the whole of SoftFloat Release 3e as well as to
bf215546Sopenharmony_ci * each source file individually.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Copyright 2011, 2012, 2013, 2014, 2015, 2016, 2017, 2018 The Regents of the
bf215546Sopenharmony_ci * University of California.  All rights reserved.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Redistribution and use in source and binary forms, with or without
bf215546Sopenharmony_ci * modification, are permitted provided that the following conditions are met:
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci *  1. Redistributions of source code must retain the above copyright notice,
bf215546Sopenharmony_ci *     this list of conditions, and the following disclaimer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci *  2. Redistributions in binary form must reproduce the above copyright
bf215546Sopenharmony_ci *     notice, this list of conditions, and the following disclaimer in the
bf215546Sopenharmony_ci *     documentation and/or other materials provided with the distribution.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci *  3. Neither the name of the University nor the names of its contributors
bf215546Sopenharmony_ci *     may be used to endorse or promote products derived from this software
bf215546Sopenharmony_ci *     without specific prior written permission.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY
bf215546Sopenharmony_ci * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
bf215546Sopenharmony_ci * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE
bf215546Sopenharmony_ci * DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY
bf215546Sopenharmony_ci * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
bf215546Sopenharmony_ci * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
bf215546Sopenharmony_ci * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
bf215546Sopenharmony_ci * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
bf215546Sopenharmony_ci * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
bf215546Sopenharmony_ci * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * The functions listed in this file are modified versions of the ones
bf215546Sopenharmony_ci * from the Berkeley SoftFloat 3e Library.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Their implementation correctness has been checked with the Berkeley
bf215546Sopenharmony_ci * TestFloat Release 3e tool for x86_64.
bf215546Sopenharmony_ci */
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci#include "rounding.h"
bf215546Sopenharmony_ci#include "bitscan.h"
bf215546Sopenharmony_ci#include "softfloat.h"
bf215546Sopenharmony_ci
/*
 * Word-order helpers for multiword integers stored as arrays of 32-bit words.
 *
 *   word_incr                       step that moves an index one word towards
 *                                   the most-significant end
 *   index_word(total, n)            index of the n-th word counted from the
 *                                   least-significant end
 *   index_word_hi(total)            index of the most-significant word
 *   index_word_lo(total)            index of the least-significant word
 *   index_multiword_hi(total, n)    start of the n most-significant words
 *   index_multiword_lo(total, n)    start of the n least-significant words
 *   index_multiword_hi_but(total, n) start of the high words that remain after
 *                                   dropping the n least-significant ones
 *   index_multiword_lo_but(total, n) start of the low words that remain after
 *                                   dropping the n most-significant ones
 *
 * NOTE(review): some C libraries define BIG_ENDIAN as a byte-order constant on
 * every platform; confirm that testing it with defined() selects the intended
 * branch in this build.
 */
#if !defined(BIG_ENDIAN)
/* Least-significant word is stored first. */
#define word_incr 1
#define index_word(total, n) (n)
#define index_word_hi(total) ((total) - 1)
#define index_word_lo(total) 0
#define index_multiword_hi(total, n) ((total) - (n))
#define index_multiword_lo(total, n) 0
#define index_multiword_hi_but(total, n) (n)
#define index_multiword_lo_but(total, n) 0
#else
/* Most-significant word is stored first. */
#define word_incr -1
#define index_word(total, n) ((total) - 1 - (n))
#define index_word_hi(total) 0
#define index_word_lo(total) ((total) - 1)
#define index_multiword_hi(total, n) 0
#define index_multiword_lo(total, n) ((total) - (n))
#define index_multiword_hi_but(total, n) 0
#define index_multiword_lo_but(total, n) (n)
#endif
bf215546Sopenharmony_ci
/* A double together with signed and unsigned views of its 64-bit pattern. */
typedef union {
    double f;
    int64_t i;
    uint64_t u;
} di_type;

/* A float together with signed and unsigned views of its 32-bit pattern. */
typedef union {
    float f;
    int32_t i;
    uint32_t u;
} fi_type;
bf215546Sopenharmony_ci
/*
 * Number of leading zero bits of every 8-bit value, indexed by that value.
 * Entry 0 is 8 (no bit set at all).
 */
const uint8_t count_leading_zeros8[256] = {
    /* 0x00 - 0x0f */
    8, 7, 6, 6, 5, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 4,
    /* 0x10 - 0x1f: three leading zeros */
    3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
    /* 0x20 - 0x3f: two leading zeros */
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
    /* 0x40 - 0x7f: one leading zero */
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
    1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1
    /*
     * 0x80 - 0xff: the top bit is set, so the count is 0.  These 128 entries
     * are left to the implicit zero initialisation of the remaining elements.
     */
};
bf215546Sopenharmony_ci
/**
 * \brief Right-shifts 'a' by 'dist' bits while keeping a "sticky" bit.
 *
 * 'dist' must be in the range 1 to 63.  If at least one of the bits shifted
 * out of 'a' is nonzero, the least-significant bit of the result is forced to
 * 1 ("jammed"), so the caller can still tell that precision was lost.
 *
 * From softfloat_shortShiftRightJam64()
 */
static inline
uint64_t _mesa_short_shift_right_jam64(uint64_t a, uint8_t dist)
{
    /* Mask covering exactly the 'dist' low bits that fall off the end. */
    const uint64_t dropped_mask = ((uint64_t) 1 << dist) - 1;
    const uint64_t sticky = (a & dropped_mask) != 0;

    return (a >> dist) | sticky;
}
bf215546Sopenharmony_ci
/**
 * \brief Right-shifts 'a' by an arbitrary nonzero 'dist', jamming lost bits.
 *
 * Any nonzero bit that is shifted out is folded into the least-significant
 * bit of the result by setting that bit to 1.  'dist' must not be zero but
 * may be arbitrarily large: from 63 upwards the result is simply 1 when 'a'
 * is nonzero and 0 otherwise.
 *
 * From softfloat_shiftRightJam64()
 */
static inline
uint64_t _mesa_shift_right_jam64(uint64_t a, uint32_t dist)
{
    if (dist >= 63)
        return a != 0;

    /* Left-shifting by (64 - dist) leaves only the bits that get dropped. */
    const uint64_t dropped = a << ((0u - dist) & 63u);

    return (a >> dist) | (dropped != 0);
}
bf215546Sopenharmony_ci
/**
 * \brief Right-shifts 'a' by an arbitrary nonzero 'dist', jamming lost bits.
 *
 * Any nonzero bit that is shifted out is folded into the least-significant
 * bit of the result by setting that bit to 1.  'dist' must not be zero but
 * may be arbitrarily large: from 31 upwards the result is simply 1 when 'a'
 * is nonzero and 0 otherwise.
 *
 * From softfloat_shiftRightJam32()
 */
static inline
uint32_t _mesa_shift_right_jam32(uint32_t a, uint16_t dist)
{
    if (dist >= 31)
        return a != 0;

    /* Left-shifting by (32 - dist) leaves only the bits that get dropped. */
    const uint32_t dropped = a << ((32u - dist) & 31u);

    return (a >> dist) | (dropped != 0);
}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Extracted from softfloat_roundPackToF64()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline
bf215546Sopenharmony_cidouble _mesa_roundtozero_f64(int64_t s, int64_t e, int64_t m)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    di_type result;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if ((uint64_t) e >= 0x7fd) {
bf215546Sopenharmony_ci        if (e < 0) {
bf215546Sopenharmony_ci            m = _mesa_shift_right_jam64(m, -e);
bf215546Sopenharmony_ci            e = 0;
bf215546Sopenharmony_ci        } else if ((e > 0x7fd) || (0x8000000000000000 <= m)) {
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            m = 0;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + m;
bf215546Sopenharmony_ci            result.u -= 1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    m >>= 10;
bf215546Sopenharmony_ci    if (m == 0)
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    result.u = (s << 63) + (e << 52) + m;
bf215546Sopenharmony_ci    return result.f;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Extracted from softfloat_roundPackToF32()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline
bf215546Sopenharmony_cifloat _mesa_round_f32(int32_t s, int32_t e, int32_t m, bool rtz)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    fi_type result;
bf215546Sopenharmony_ci    uint8_t round_increment = rtz ? 0 : 0x40;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if ((uint32_t) e >= 0xfd) {
bf215546Sopenharmony_ci        if (e < 0) {
bf215546Sopenharmony_ci            m = _mesa_shift_right_jam32(m, -e);
bf215546Sopenharmony_ci            e = 0;
bf215546Sopenharmony_ci        } else if ((e > 0xfd) || (0x80000000 <= m + round_increment)) {
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            m = 0;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci            result.u -= !round_increment;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    uint8_t round_bits;
bf215546Sopenharmony_ci    round_bits = m & 0x7f;
bf215546Sopenharmony_ci    m = ((uint32_t) m + round_increment) >> 7;
bf215546Sopenharmony_ci    m &= ~(uint32_t) (! (round_bits ^ 0x40) & !rtz);
bf215546Sopenharmony_ci    if (m == 0)
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci    return result.f;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
/**
 * \brief Packs sign, exponent and significand into a 16-bit float pattern,
 * rounding towards zero.
 *
 * Extracted from softfloat_roundPackToF16()
 *
 * \param s  sign bit (0 or 1)
 * \param e  biased exponent; may be negative (subnormal result) or exceed
 *           the largest finite exponent (overflow)
 * \param m  significand carrying 4 extra low-order bits, which are truncated
 *
 * \return the packed bits; on overflow the largest finite value of the given
 *         sign.
 */
static inline
uint16_t _mesa_roundtozero_f16(int16_t s, int16_t e, int16_t m)
{
    if (e < 0) {
        /* Subnormal: denormalize, keeping lost bits as a sticky bit. */
        m = _mesa_shift_right_jam32(m, -e);
        e = 0;
    } else if (e > 0x1d) {
        /* Overflow: one below the infinity pattern is the max finite. */
        return (s << 15) + (0x1f << 10) - 1;
    }

    /* Round towards zero: drop the 4 extra precision bits. */
    m >>= 4;

    const int exp_field = (m != 0) ? e : 0;

    return (s << 15) + (exp_field << 10) + m;
}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Shifts the N-bit unsigned integer pointed to by 'a' left by the number of
bf215546Sopenharmony_ci * bits given in 'dist', where N = 'size_words' * 32.  The value of 'dist'
bf215546Sopenharmony_ci * must be in the range 1 to 31.  Any nonzero bits shifted off are lost.  The
bf215546Sopenharmony_ci * shifted N-bit result is stored at the location pointed to by 'm_out'.  Each
bf215546Sopenharmony_ci * of 'a' and 'm_out' points to a 'size_words'-long array of 32-bit elements
bf215546Sopenharmony_ci * that concatenate in the platform's normal endian order to form an N-bit
bf215546Sopenharmony_ci * integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_shortShiftLeftM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_short_shift_left_m(uint8_t size_words, const uint32_t *a, uint8_t dist, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    uint8_t neg_dist;
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint32_t part_word, a_word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    neg_dist = -dist;
bf215546Sopenharmony_ci    index = index_word_hi(size_words);
bf215546Sopenharmony_ci    last_index = index_word_lo(size_words);
bf215546Sopenharmony_ci    part_word = a[index] << dist;
bf215546Sopenharmony_ci    while (index != last_index) {
bf215546Sopenharmony_ci        a_word = a[index - word_incr];
bf215546Sopenharmony_ci        m_out[index] = part_word | a_word >> (neg_dist & 31);
bf215546Sopenharmony_ci        index -= word_incr;
bf215546Sopenharmony_ci        part_word = a_word << dist;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    m_out[index] = part_word;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Shifts the N-bit unsigned integer pointed to by 'a' left by the number of
bf215546Sopenharmony_ci * bits given in 'dist', where N = 'size_words' * 32.  The value of 'dist'
bf215546Sopenharmony_ci * must not be zero.  Any nonzero bits shifted off are lost.  The shifted
bf215546Sopenharmony_ci * N-bit result is stored at the location pointed to by 'm_out'.  Each of 'a'
bf215546Sopenharmony_ci * and 'm_out' points to a 'size_words'-long array of 32-bit elements that
bf215546Sopenharmony_ci * concatenate in the platform's normal endian order to form an N-bit
bf215546Sopenharmony_ci * integer. The value of 'dist' can be arbitrarily large.  In particular, if
bf215546Sopenharmony_ci * 'dist' is greater than N, the stored result will be 0.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_shiftLeftM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_shift_left_m(uint8_t size_words, const uint32_t *a, uint32_t dist, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    uint32_t word_dist;
bf215546Sopenharmony_ci    uint8_t inner_dist;
bf215546Sopenharmony_ci    uint8_t i;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    word_dist = dist >> 5;
bf215546Sopenharmony_ci    if (word_dist < size_words) {
bf215546Sopenharmony_ci        a += index_multiword_lo_but(size_words, word_dist);
bf215546Sopenharmony_ci        inner_dist = dist & 31;
bf215546Sopenharmony_ci        if (inner_dist) {
bf215546Sopenharmony_ci            _mesa_short_shift_left_m(size_words - word_dist, a, inner_dist,
bf215546Sopenharmony_ci                                     m_out + index_multiword_hi_but(size_words, word_dist));
bf215546Sopenharmony_ci            if (!word_dist)
bf215546Sopenharmony_ci                return;
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            uint32_t *dest = m_out + index_word_hi(size_words);
bf215546Sopenharmony_ci            a += index_word_hi(size_words - word_dist);
bf215546Sopenharmony_ci            for (i = size_words - word_dist; i; --i) {
bf215546Sopenharmony_ci                *dest = *a;
bf215546Sopenharmony_ci                a -= word_incr;
bf215546Sopenharmony_ci                dest -= word_incr;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        m_out += index_multiword_lo(size_words, word_dist);
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        word_dist = size_words;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    do {
bf215546Sopenharmony_ci        *m_out++ = 0;
bf215546Sopenharmony_ci        --word_dist;
bf215546Sopenharmony_ci    } while (word_dist);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Shifts the N-bit unsigned integer pointed to by 'a' right by the number of
bf215546Sopenharmony_ci * bits given in 'dist', where N = 'size_words' * 32.  The value of 'dist'
bf215546Sopenharmony_ci * must be in the range 1 to 31.  Any nonzero bits shifted off are lost.  The
bf215546Sopenharmony_ci * shifted N-bit result is stored at the location pointed to by 'm_out'.  Each
bf215546Sopenharmony_ci * of 'a' and 'm_out' points to a 'size_words'-long array of 32-bit elements
bf215546Sopenharmony_ci * that concatenate in the platform's normal endian order to form an N-bit
bf215546Sopenharmony_ci * integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_shortShiftRightM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_short_shift_right_m(uint8_t size_words, const uint32_t *a, uint8_t dist, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    uint8_t neg_dist;
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint32_t part_word, a_word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    neg_dist = -dist;
bf215546Sopenharmony_ci    index = index_word_lo(size_words);
bf215546Sopenharmony_ci    last_index = index_word_hi(size_words);
bf215546Sopenharmony_ci    part_word = a[index] >> dist;
bf215546Sopenharmony_ci    while (index != last_index) {
bf215546Sopenharmony_ci        a_word = a[index + word_incr];
bf215546Sopenharmony_ci        m_out[index] = a_word << (neg_dist & 31) | part_word;
bf215546Sopenharmony_ci        index += word_incr;
bf215546Sopenharmony_ci        part_word = a_word >> dist;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    m_out[index] = part_word;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Shifts the N-bit unsigned integer pointed to by 'a' right by the number of
bf215546Sopenharmony_ci * bits given in 'dist', where N = 'size_words' * 32.  The value of 'dist'
bf215546Sopenharmony_ci * must be in the range 1 to 31.  If any nonzero bits are shifted off, they
bf215546Sopenharmony_ci * are "jammed" into the least-significant bit of the shifted value by setting
bf215546Sopenharmony_ci * the least-significant bit to 1.  This shifted-and-jammed N-bit result is
bf215546Sopenharmony_ci * stored at the location pointed to by 'm_out'.  Each of 'a' and 'm_out'
bf215546Sopenharmony_ci * points to a 'size_words'-long array of 32-bit elements that concatenate in
bf215546Sopenharmony_ci * the platform's normal endian order to form an N-bit integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_shortShiftRightJamM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_short_shift_right_jam_m(uint8_t size_words, const uint32_t *a, uint8_t dist, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    uint8_t neg_dist;
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint64_t part_word, a_word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    neg_dist = -dist;
bf215546Sopenharmony_ci    index = index_word_lo(size_words);
bf215546Sopenharmony_ci    last_index = index_word_hi(size_words);
bf215546Sopenharmony_ci    a_word = a[index];
bf215546Sopenharmony_ci    part_word = a_word >> dist;
bf215546Sopenharmony_ci    if (part_word << dist != a_word )
bf215546Sopenharmony_ci        part_word |= 1;
bf215546Sopenharmony_ci    while (index != last_index) {
bf215546Sopenharmony_ci        a_word = a[index + word_incr];
bf215546Sopenharmony_ci        m_out[index] = a_word << (neg_dist & 31) | part_word;
bf215546Sopenharmony_ci        index += word_incr;
bf215546Sopenharmony_ci        part_word = a_word >> dist;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    m_out[index] = part_word;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Shifts the N-bit unsigned integer pointed to by 'a' right by the number of
bf215546Sopenharmony_ci * bits given in 'dist', where N = 'size_words' * 32.  The value of 'dist'
bf215546Sopenharmony_ci * must not be zero.  If any nonzero bits are shifted off, they are "jammed"
bf215546Sopenharmony_ci * into the least-significant bit of the shifted value by setting the
bf215546Sopenharmony_ci * least-significant bit to 1.  This shifted-and-jammed N-bit result is stored
bf215546Sopenharmony_ci * at the location pointed to by 'm_out'.  Each of 'a' and 'm_out' points to a
bf215546Sopenharmony_ci * 'size_words'-long array of 32-bit elements that concatenate in the
bf215546Sopenharmony_ci * platform's normal endian order to form an N-bit integer.  The value of
bf215546Sopenharmony_ci * 'dist' can be arbitrarily large.  In particular, if 'dist' is greater than
bf215546Sopenharmony_ci * N, the stored result will be either 0 or 1, depending on whether the
bf215546Sopenharmony_ci * original N bits are all zeros.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_shiftRightJamM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_shift_right_jam_m(uint8_t size_words, const uint32_t *a, uint32_t dist, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    uint32_t word_jam, word_dist, *tmp;
bf215546Sopenharmony_ci    uint8_t i, inner_dist;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    word_jam = 0;
bf215546Sopenharmony_ci    word_dist = dist >> 5;
bf215546Sopenharmony_ci    tmp = NULL;
bf215546Sopenharmony_ci    if (word_dist) {
bf215546Sopenharmony_ci        if (size_words < word_dist)
bf215546Sopenharmony_ci            word_dist = size_words;
bf215546Sopenharmony_ci        tmp = (uint32_t *) (a + index_multiword_lo(size_words, word_dist));
bf215546Sopenharmony_ci        i = word_dist;
bf215546Sopenharmony_ci        do {
bf215546Sopenharmony_ci            word_jam = *tmp++;
bf215546Sopenharmony_ci            if (word_jam)
bf215546Sopenharmony_ci                break;
bf215546Sopenharmony_ci            --i;
bf215546Sopenharmony_ci        } while (i);
bf215546Sopenharmony_ci        tmp = m_out;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    if (word_dist < size_words) {
bf215546Sopenharmony_ci        a += index_multiword_hi_but(size_words, word_dist);
bf215546Sopenharmony_ci        inner_dist = dist & 31;
bf215546Sopenharmony_ci        if (inner_dist) {
bf215546Sopenharmony_ci            _mesa_short_shift_right_jam_m(size_words - word_dist, a, inner_dist,
bf215546Sopenharmony_ci                                          m_out + index_multiword_lo_but(size_words, word_dist));
bf215546Sopenharmony_ci            if (!word_dist) {
bf215546Sopenharmony_ci                if (word_jam)
bf215546Sopenharmony_ci                    m_out[index_word_lo(size_words)] |= 1;
bf215546Sopenharmony_ci                return;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            a += index_word_lo(size_words - word_dist);
bf215546Sopenharmony_ci            tmp = m_out + index_word_lo(size_words);
bf215546Sopenharmony_ci            for (i = size_words - word_dist; i; --i) {
bf215546Sopenharmony_ci                *tmp = *a;
bf215546Sopenharmony_ci                a += word_incr;
bf215546Sopenharmony_ci                tmp += word_incr;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        tmp = m_out + index_multiword_hi(size_words, word_dist);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    if (tmp) {
bf215546Sopenharmony_ci       do {
bf215546Sopenharmony_ci           *tmp++ = 0;
bf215546Sopenharmony_ci           --word_dist;
bf215546Sopenharmony_ci       } while (word_dist);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    if (word_jam)
bf215546Sopenharmony_ci        m_out[index_word_lo(size_words)] |= 1;
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Calculate a + b but rounding to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Notice that this mainly differs from the original Berkeley SoftFloat 3e
bf215546Sopenharmony_ci * implementation in that we don't really treat NaNs, Zeroes nor the
bf215546Sopenharmony_ci * signalling flags. Any NaN is good for us and the sign of the Zero is not
bf215546Sopenharmony_ci * important.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f64_add()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cidouble
bf215546Sopenharmony_ci_mesa_double_add_rtz(double a, double b)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const di_type a_di = {a};
bf215546Sopenharmony_ci    uint64_t a_flt_m = a_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t a_flt_e = (a_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t a_flt_s = (a_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    const di_type b_di = {b};
bf215546Sopenharmony_ci    uint64_t b_flt_m = b_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t b_flt_e = (b_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t b_flt_s = (b_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    int64_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    s = a_flt_s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    const int64_t exp_diff = a_flt_e - b_flt_e;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    /* Handle special cases */
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_s != b_flt_s) {
bf215546Sopenharmony_ci        return _mesa_double_sub_rtz(a, -b);
bf215546Sopenharmony_ci    } else if ((a_flt_e == 0) && (a_flt_m == 0)) {
bf215546Sopenharmony_ci        /* 'a' is zero, return 'b' */
bf215546Sopenharmony_ci        return b;
bf215546Sopenharmony_ci    } else if ((b_flt_e == 0) && (b_flt_m == 0)) {
bf215546Sopenharmony_ci        /* 'b' is zero, return 'a' */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (a_flt_e == 0x7ff && a_flt_m != 0) {
bf215546Sopenharmony_ci        /* 'a' is a NaN, return NaN */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (b_flt_e == 0x7ff && b_flt_m != 0) {
bf215546Sopenharmony_ci        /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci        return b;
bf215546Sopenharmony_ci    } else if (a_flt_e == 0x7ff && a_flt_m == 0) {
bf215546Sopenharmony_ci        /* Inf + x = Inf */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (b_flt_e == 0x7ff && b_flt_m == 0) {
bf215546Sopenharmony_ci        /* x + Inf = Inf */
bf215546Sopenharmony_ci        return b;
bf215546Sopenharmony_ci    } else if (exp_diff == 0 && a_flt_e == 0) {
bf215546Sopenharmony_ci        di_type result_di;
bf215546Sopenharmony_ci        result_di.u = a_di.u + b_flt_m;
bf215546Sopenharmony_ci        return result_di.f;
bf215546Sopenharmony_ci    } else if (exp_diff == 0) {
bf215546Sopenharmony_ci        e = a_flt_e;
bf215546Sopenharmony_ci        m = 0x0020000000000000 + a_flt_m + b_flt_m;
bf215546Sopenharmony_ci        m <<= 9;
bf215546Sopenharmony_ci    } else if (exp_diff < 0) {
bf215546Sopenharmony_ci        a_flt_m <<= 9;
bf215546Sopenharmony_ci        b_flt_m <<= 9;
bf215546Sopenharmony_ci        e = b_flt_e;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (a_flt_e != 0)
bf215546Sopenharmony_ci            a_flt_m += 0x2000000000000000;
bf215546Sopenharmony_ci        else
bf215546Sopenharmony_ci            a_flt_m <<= 1;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        a_flt_m = _mesa_shift_right_jam64(a_flt_m, -exp_diff);
bf215546Sopenharmony_ci        m = 0x2000000000000000 + a_flt_m + b_flt_m;
bf215546Sopenharmony_ci        if (m < 0x4000000000000000) {
bf215546Sopenharmony_ci            --e;
bf215546Sopenharmony_ci            m <<= 1;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        a_flt_m <<= 9;
bf215546Sopenharmony_ci        b_flt_m <<= 9;
bf215546Sopenharmony_ci        e = a_flt_e;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (b_flt_e != 0)
bf215546Sopenharmony_ci            b_flt_m += 0x2000000000000000;
bf215546Sopenharmony_ci        else
bf215546Sopenharmony_ci            b_flt_m <<= 1;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        b_flt_m = _mesa_shift_right_jam64(b_flt_m, exp_diff);
bf215546Sopenharmony_ci        m = 0x2000000000000000 + a_flt_m + b_flt_m;
bf215546Sopenharmony_ci        if (m < 0x4000000000000000) {
bf215546Sopenharmony_ci            --e;
bf215546Sopenharmony_ci            m <<= 1;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_roundtozero_f64(s, e, m);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
/**
 * \brief Counts the 0 bits above the most-significant 1 bit of the 64-bit
 * value 'a'.  For a == 0 the result is 64.
 *
 * Computed as 64 minus the value reported by util_last_bit64().
 */
static inline unsigned
_mesa_count_leading_zeros64(uint64_t a)
{
    const unsigned used_bits = util_last_bit64(a);

    return 64 - used_bits;
}
bf215546Sopenharmony_ci
/**
 * \brief Counts the 0 bits above the most-significant 1 bit of the 32-bit
 * value 'a'.  For a == 0 the result is 32.
 *
 * Computed as 32 minus the value reported by util_last_bit().
 */
static inline unsigned
_mesa_count_leading_zeros32(uint32_t a)
{
    const unsigned used_bits = util_last_bit(a);

    return 32 - used_bits;
}
bf215546Sopenharmony_ci
bf215546Sopenharmony_cistatic inline double
bf215546Sopenharmony_ci_mesa_norm_round_pack_f64(int64_t s, int64_t e, int64_t m)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    int8_t shift_dist;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    shift_dist = _mesa_count_leading_zeros64(m) - 1;
bf215546Sopenharmony_ci    e -= shift_dist;
bf215546Sopenharmony_ci    if ((10 <= shift_dist) && ((unsigned) e < 0x7fd)) {
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        result.u = (s << 63) + ((m ? e : 0) << 52) + (m << (shift_dist - 10));
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        return _mesa_roundtozero_f64(s, e, m << shift_dist);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Replaces the N-bit unsigned integer pointed to by 'm_out' by the
bf215546Sopenharmony_ci * 2s-complement of itself, where N = 'size_words' * 32.  Argument 'm_out'
bf215546Sopenharmony_ci * points to a 'size_words'-long array of 32-bit elements that concatenate in
bf215546Sopenharmony_ci * the platform's normal endian order to form an N-bit integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_negXM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_neg_x_m(uint8_t size_words, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint8_t carry;
bf215546Sopenharmony_ci    uint32_t word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    index = index_word_lo(size_words);
bf215546Sopenharmony_ci    last_index = index_word_hi(size_words);
bf215546Sopenharmony_ci    carry = 1;
bf215546Sopenharmony_ci    for (;;) {
bf215546Sopenharmony_ci        word = ~m_out[index] + carry;
bf215546Sopenharmony_ci        m_out[index] = word;
bf215546Sopenharmony_ci        if (index == last_index)
bf215546Sopenharmony_ci            break;
bf215546Sopenharmony_ci        index += word_incr;
bf215546Sopenharmony_ci        if (word)
bf215546Sopenharmony_ci            carry = 0;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Adds the two N-bit integers pointed to by 'a' and 'b', where N =
bf215546Sopenharmony_ci * 'size_words' * 32.  The addition is modulo 2^N, so any carry out is
bf215546Sopenharmony_ci * lost. The N-bit sum is stored at the location pointed to by 'm_out'.  Each
bf215546Sopenharmony_ci * of 'a', 'b', and 'm_out' points to a 'size_words'-long array of 32-bit
bf215546Sopenharmony_ci * elements that concatenate in the platform's normal endian order to form an
bf215546Sopenharmony_ci * N-bit integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_addM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_add_m(uint8_t size_words, const uint32_t *a, const uint32_t *b, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint8_t carry;
bf215546Sopenharmony_ci    uint32_t a_word, word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    index = index_word_lo(size_words);
bf215546Sopenharmony_ci    last_index = index_word_hi(size_words);
bf215546Sopenharmony_ci    carry = 0;
bf215546Sopenharmony_ci    for (;;) {
bf215546Sopenharmony_ci        a_word = a[index];
bf215546Sopenharmony_ci        word = a_word + b[index] + carry;
bf215546Sopenharmony_ci        m_out[index] = word;
bf215546Sopenharmony_ci        if (index == last_index)
bf215546Sopenharmony_ci            break;
bf215546Sopenharmony_ci        if (word != a_word)
bf215546Sopenharmony_ci            carry = (word < a_word);
bf215546Sopenharmony_ci        index += word_incr;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Subtracts the two N-bit integers pointed to by 'a' and 'b', where N =
bf215546Sopenharmony_ci * 'size_words' * 32.  The subtraction is modulo 2^N, so any borrow out (carry
bf215546Sopenharmony_ci * out) is lost.  The N-bit difference is stored at the location pointed to by
bf215546Sopenharmony_ci * 'm_out'.  Each of 'a', 'b', and 'm_out' points to a 'size_words'-long array
bf215546Sopenharmony_ci * of 32-bit elements that concatenate in the platform's normal endian order
bf215546Sopenharmony_ci * to form an N-bit integer.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From softfloat_subM()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cistatic inline void
bf215546Sopenharmony_ci_mesa_sub_m(uint8_t size_words, const uint32_t *a, const uint32_t *b, uint32_t *m_out)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    unsigned index, last_index;
bf215546Sopenharmony_ci    uint8_t borrow;
bf215546Sopenharmony_ci    uint32_t a_word, b_word;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    index = index_word_lo(size_words);
bf215546Sopenharmony_ci    last_index = index_word_hi(size_words);
bf215546Sopenharmony_ci    borrow = 0;
bf215546Sopenharmony_ci    for (;;) {
bf215546Sopenharmony_ci        a_word = a[index];
bf215546Sopenharmony_ci        b_word = b[index];
bf215546Sopenharmony_ci        m_out[index] = a_word - b_word - borrow;
bf215546Sopenharmony_ci        if (index == last_index)
bf215546Sopenharmony_ci            break;
bf215546Sopenharmony_ci        borrow = borrow ? (a_word <= b_word) : (a_word < b_word);
bf215546Sopenharmony_ci        index += word_incr;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/* Calculate a - b but rounding to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Notice that this mainly differs from the original Berkeley SoftFloat 3e
bf215546Sopenharmony_ci * implementation in that we don't really treat NaNs, Zeroes nor the
bf215546Sopenharmony_ci * signalling flags. Any NaN is good for us and the sign of the Zero is not
bf215546Sopenharmony_ci * important.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f64_sub()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cidouble
bf215546Sopenharmony_ci_mesa_double_sub_rtz(double a, double b)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const di_type a_di = {a};
bf215546Sopenharmony_ci    uint64_t a_flt_m = a_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t a_flt_e = (a_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t a_flt_s = (a_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    const di_type b_di = {b};
bf215546Sopenharmony_ci    uint64_t b_flt_m = b_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t b_flt_e = (b_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t b_flt_s = (b_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    int64_t s, e, m = 0;
bf215546Sopenharmony_ci    int64_t m_diff = 0;
bf215546Sopenharmony_ci    unsigned shift_dist = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    s = a_flt_s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    const int64_t exp_diff = a_flt_e - b_flt_e;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    /* Handle special cases */
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_s != b_flt_s) {
bf215546Sopenharmony_ci        return _mesa_double_add_rtz(a, -b);
bf215546Sopenharmony_ci    } else if ((a_flt_e == 0) && (a_flt_m == 0)) {
bf215546Sopenharmony_ci        /* 'a' is zero, return '-b' */
bf215546Sopenharmony_ci        return -b;
bf215546Sopenharmony_ci    } else if ((b_flt_e == 0) && (b_flt_m == 0)) {
bf215546Sopenharmony_ci        /* 'b' is zero, return 'a' */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (a_flt_e == 0x7ff && a_flt_m != 0) {
bf215546Sopenharmony_ci        /* 'a' is a NaN, return NaN */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (b_flt_e == 0x7ff && b_flt_m != 0) {
bf215546Sopenharmony_ci        /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci        return b;
bf215546Sopenharmony_ci    } else if (a_flt_e == 0x7ff && a_flt_m == 0) {
bf215546Sopenharmony_ci        if (b_flt_e == 0x7ff && b_flt_m == 0) {
bf215546Sopenharmony_ci            /* Inf - Inf =  NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        /* Inf - x = Inf */
bf215546Sopenharmony_ci        return a;
bf215546Sopenharmony_ci    } else if (b_flt_e == 0x7ff && b_flt_m == 0) {
bf215546Sopenharmony_ci        /* x - Inf = -Inf */
bf215546Sopenharmony_ci        return -b;
bf215546Sopenharmony_ci    } else if (exp_diff == 0) {
bf215546Sopenharmony_ci        m_diff = a_flt_m - b_flt_m;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (m_diff == 0)
bf215546Sopenharmony_ci            return 0;
bf215546Sopenharmony_ci        if (a_flt_e)
bf215546Sopenharmony_ci            --a_flt_e;
bf215546Sopenharmony_ci        if (m_diff < 0) {
bf215546Sopenharmony_ci            s = !s;
bf215546Sopenharmony_ci            m_diff = -m_diff;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        shift_dist = _mesa_count_leading_zeros64(m_diff) - 11;
bf215546Sopenharmony_ci        e = a_flt_e - shift_dist;
bf215546Sopenharmony_ci        if (e < 0) {
bf215546Sopenharmony_ci            shift_dist = a_flt_e;
bf215546Sopenharmony_ci            e = 0;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        result.u = (s << 63) + (e << 52) + (m_diff << shift_dist);
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    } else if (exp_diff < 0) {
bf215546Sopenharmony_ci        a_flt_m <<= 10;
bf215546Sopenharmony_ci        b_flt_m <<= 10;
bf215546Sopenharmony_ci        s = !s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        a_flt_m += (a_flt_e) ? 0x4000000000000000 : a_flt_m;
bf215546Sopenharmony_ci        a_flt_m = _mesa_shift_right_jam64(a_flt_m, -exp_diff);
bf215546Sopenharmony_ci        b_flt_m |= 0x4000000000000000;
bf215546Sopenharmony_ci        e = b_flt_e;
bf215546Sopenharmony_ci        m = b_flt_m - a_flt_m;
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        a_flt_m <<= 10;
bf215546Sopenharmony_ci        b_flt_m <<= 10;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        b_flt_m += (b_flt_e) ? 0x4000000000000000 : b_flt_m;
bf215546Sopenharmony_ci        b_flt_m = _mesa_shift_right_jam64(b_flt_m, exp_diff);
bf215546Sopenharmony_ci        a_flt_m |= 0x4000000000000000;
bf215546Sopenharmony_ci        e = a_flt_e;
bf215546Sopenharmony_ci        m = a_flt_m - b_flt_m;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_norm_round_pack_f64(s, e - 1, m);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
/**
 * \brief Shifts the mantissa 'm' left so that exactly 11 zero bits remain
 * above its most-significant 1 bit (i.e. that bit lands on bit 52), and
 * reports the matching exponent.
 *
 * '*m_out' receives the shifted mantissa and '*exp' receives 1 minus the
 * shift distance.  Because '*exp' is unsigned, a negative exponent is stored
 * modulo 2^64.
 */
static inline void
_mesa_norm_subnormal_mantissa_f64(uint64_t m, uint64_t *exp, uint64_t *m_out)
{
    const int left_shift = _mesa_count_leading_zeros64(m) - 11;

    *exp = 1 - left_shift;
    *m_out = m << left_shift;
}
bf215546Sopenharmony_ci
/**
 * \brief Shifts the mantissa 'm' left so that exactly 8 zero bits remain
 * above its most-significant 1 bit (i.e. that bit lands on bit 23), and
 * reports the matching exponent.
 *
 * '*m_out' receives the shifted mantissa and '*exp' receives 1 minus the
 * shift distance.  Because '*exp' is unsigned, a negative exponent is stored
 * modulo 2^32.
 */
static inline void
_mesa_norm_subnormal_mantissa_f32(uint32_t m, uint32_t *exp, uint32_t *m_out)
{
    const int left_shift = _mesa_count_leading_zeros32(m) - 8;

    *exp = 1 - left_shift;
    *m_out = m << left_shift;
}
bf215546Sopenharmony_ci
/**
 * \brief Computes the full 128-bit product of the 64-bit values 'a' and 'b'
 * and stores it at the location pointed to by 'm_out'.  'm_out' refers to an
 * array of four 32-bit elements which, concatenated in the platform's normal
 * endian order, make up the 128-bit integer.
 *
 * From softfloat_mul64To128M()
 */
static inline void
_mesa_softfloat_mul_f64_to_f128_m(uint64_t a, uint64_t b, uint32_t *m_out)
{
    /* Split both operands into 32-bit halves. */
    const uint32_t a_hi = a >> 32;
    const uint32_t a_lo = a;
    const uint32_t b_hi = b >> 32;
    const uint32_t b_lo = b;

    /* Four 32x32 -> 64 partial products; the two cross terms are summed. */
    uint64_t low = (uint64_t) a_lo * b_lo;
    const uint64_t cross_first = (uint64_t) a_hi * b_lo;
    uint64_t cross = cross_first + (uint64_t) a_lo * b_hi;
    uint64_t high = (uint64_t) a_hi * b_hi;

    /* A wrap of the cross sum is worth 2^32 in the upper 64 bits; the top
     * half of the cross sum goes into the upper 64 bits as well.
     */
    const uint64_t cross_wrap = (uint64_t) (cross < cross_first) << 32;
    high += cross_wrap | (cross >> 32);

    /* The bottom half of the cross sum goes into the lower 64 bits, and any
     * carry out of that addition moves up.
     */
    cross <<= 32;
    low += cross;
    high += (low < cross);

    m_out[index_word(4, 0)] = low;
    m_out[index_word(4, 1)] = low >> 32;
    m_out[index_word(4, 2)] = high;
    m_out[index_word(4, 3)] = high >> 32;
}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/* Calculate a * b but rounding to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Notice that this mainly differs from the original Berkeley SoftFloat 3e
bf215546Sopenharmony_ci * implementation in that we don't really treat NaNs, Zeroes nor the
bf215546Sopenharmony_ci * signalling flags. Any NaN is good for us and the sign of the Zero is not
bf215546Sopenharmony_ci * important.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f64_mul()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cidouble
bf215546Sopenharmony_ci_mesa_double_mul_rtz(double a, double b)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const di_type a_di = {a};
bf215546Sopenharmony_ci    uint64_t a_flt_m = a_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t a_flt_e = (a_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t a_flt_s = (a_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    const di_type b_di = {b};
bf215546Sopenharmony_ci    uint64_t b_flt_m = b_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t b_flt_e = (b_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t b_flt_s = (b_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    int64_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    s = a_flt_s ^ b_flt_s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (a_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'a' is a NaN, return NaN */
bf215546Sopenharmony_ci            return a;
bf215546Sopenharmony_ci        } else if (b_flt_e == 0x7ff && b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (!(b_flt_e | b_flt_m)) {
bf215546Sopenharmony_ci            /* Inf * 0 = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        /* Inf * x = Inf */
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        e = 0x7ff;
bf215546Sopenharmony_ci        result.u = (s << 63) + (e << 52) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (b_flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        if (!(a_flt_e | a_flt_m)) {
bf215546Sopenharmony_ci            /* 0 * Inf = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        /* x * Inf = Inf */
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        e = 0x7ff;
bf215546Sopenharmony_ci        result.u = (s << 63) + (e << 52) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0) {
bf215546Sopenharmony_ci        if (a_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'a' is zero. Return zero */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            result.u = (s << 63) + 0;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f64(a_flt_m , &a_flt_e, &a_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    if (b_flt_e == 0) {
bf215546Sopenharmony_ci        if (b_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'b' is zero. Return zero */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            result.u = (s << 63) + 0;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f64(b_flt_m , &b_flt_e, &b_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    e = a_flt_e + b_flt_e - 0x3ff;
bf215546Sopenharmony_ci    a_flt_m = (a_flt_m | 0x0010000000000000) << 10;
bf215546Sopenharmony_ci    b_flt_m = (b_flt_m | 0x0010000000000000) << 11;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    uint32_t m_128[4];
bf215546Sopenharmony_ci    _mesa_softfloat_mul_f64_to_f128_m(a_flt_m, b_flt_m, m_128);
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    m = (uint64_t) m_128[index_word(4, 3)] << 32 | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci    if (m_128[index_word(4, 1)] || m_128[index_word(4, 0)])
bf215546Sopenharmony_ci        m |= 1;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (m < 0x4000000000000000) {
bf215546Sopenharmony_ci        --e;
bf215546Sopenharmony_ci        m <<= 1;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_roundtozero_f64(s, e, m);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Calculate a * b + c but rounding to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Notice that this mainly differs from the original Berkeley SoftFloat 3e
bf215546Sopenharmony_ci * implementation in that we don't really treat NaNs, Zeroes nor the
bf215546Sopenharmony_ci * signalling flags. Any NaN is good for us and the sign of the Zero is not
bf215546Sopenharmony_ci * important.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f64_mulAdd()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cidouble
bf215546Sopenharmony_ci_mesa_double_fma_rtz(double a, double b, double c)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const di_type a_di = {a};
bf215546Sopenharmony_ci    uint64_t a_flt_m = a_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t a_flt_e = (a_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t a_flt_s = (a_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    const di_type b_di = {b};
bf215546Sopenharmony_ci    uint64_t b_flt_m = b_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t b_flt_e = (b_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t b_flt_s = (b_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    const di_type c_di = {c};
bf215546Sopenharmony_ci    uint64_t c_flt_m = c_di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t c_flt_e = (c_di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t c_flt_s = (c_di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    int64_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    c_flt_s ^= 0;
bf215546Sopenharmony_ci    s = a_flt_s ^ b_flt_s ^ 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (a_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'a' is a NaN, return NaN */
bf215546Sopenharmony_ci            return a;
bf215546Sopenharmony_ci        } else if (b_flt_e == 0x7ff && b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        } else if (c_flt_e == 0x7ff && c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (!(b_flt_e | b_flt_m)) {
bf215546Sopenharmony_ci            /* Inf * 0 + y = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if ((c_flt_e == 0x7ff && c_flt_m == 0) && (s != c_flt_s)) {
bf215546Sopenharmony_ci            /* Inf * x - Inf = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* Inf * x + y = Inf */
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        e = 0x7ff;
bf215546Sopenharmony_ci        result.u = (s << 63) + (e << 52) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (b_flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        } else if (c_flt_e == 0x7ff && c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (!(a_flt_e | a_flt_m)) {
bf215546Sopenharmony_ci            /* 0 * Inf + y = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if ((c_flt_e == 0x7ff && c_flt_m == 0) && (s != c_flt_s)) {
bf215546Sopenharmony_ci            /* x * Inf - Inf = NaN */
bf215546Sopenharmony_ci            di_type result;
bf215546Sopenharmony_ci            e = 0x7ff;
bf215546Sopenharmony_ci            result.u = (s << 63) + (e << 52) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* x * Inf + y = Inf */
bf215546Sopenharmony_ci        di_type result;
bf215546Sopenharmony_ci        e = 0x7ff;
bf215546Sopenharmony_ci        result.u = (s << 63) + (e << 52) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (c_flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* x * y + Inf = Inf */
bf215546Sopenharmony_ci        return c;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0) {
bf215546Sopenharmony_ci        if (a_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'a' is zero, return 'c' */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f64(a_flt_m , &a_flt_e, &a_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (b_flt_e == 0) {
bf215546Sopenharmony_ci        if (b_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'b' is zero, return 'c' */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f64(b_flt_m , &b_flt_e, &b_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    e = a_flt_e + b_flt_e - 0x3fe;
bf215546Sopenharmony_ci    a_flt_m = (a_flt_m | 0x0010000000000000) << 10;
bf215546Sopenharmony_ci    b_flt_m = (b_flt_m | 0x0010000000000000) << 11;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    uint32_t m_128[4];
bf215546Sopenharmony_ci    _mesa_softfloat_mul_f64_to_f128_m(a_flt_m, b_flt_m, m_128);
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    m = (uint64_t) m_128[index_word(4, 3)] << 32 | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    int64_t shift_dist = 0;
bf215546Sopenharmony_ci    if (!(m & 0x4000000000000000)) {
bf215546Sopenharmony_ci        --e;
bf215546Sopenharmony_ci        shift_dist = -1;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (c_flt_e == 0) {
bf215546Sopenharmony_ci        if (c_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'c' is zero, return 'a * b' */
bf215546Sopenharmony_ci            if (shift_dist)
bf215546Sopenharmony_ci                m <<= 1;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci            if (m_128[index_word(4, 1)] || m_128[index_word(4, 0)])
bf215546Sopenharmony_ci                m |= 1;
bf215546Sopenharmony_ci            return _mesa_roundtozero_f64(s, e - 1, m);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f64(c_flt_m , &c_flt_e, &c_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    c_flt_m = (c_flt_m | 0x0010000000000000) << 10;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    uint32_t c_flt_m_128[4];
bf215546Sopenharmony_ci    int64_t exp_diff = e - c_flt_e;
bf215546Sopenharmony_ci    if (exp_diff < 0) {
bf215546Sopenharmony_ci        e = c_flt_e;
bf215546Sopenharmony_ci        if ((s == c_flt_s) || (exp_diff < -1)) {
bf215546Sopenharmony_ci            shift_dist -= exp_diff;
bf215546Sopenharmony_ci            if (shift_dist) {
bf215546Sopenharmony_ci                m = _mesa_shift_right_jam64(m, shift_dist);
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            if (!shift_dist) {
bf215546Sopenharmony_ci                _mesa_short_shift_right_m(4, m_128, 1, m_128);
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        if (shift_dist)
bf215546Sopenharmony_ci            _mesa_add_m(4, m_128, m_128, m_128);
bf215546Sopenharmony_ci        if (!exp_diff) {
bf215546Sopenharmony_ci            m = (uint64_t) m_128[index_word(4, 3)] << 32
bf215546Sopenharmony_ci                | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            c_flt_m_128[index_word(4, 3)] = c_flt_m >> 32;
bf215546Sopenharmony_ci            c_flt_m_128[index_word(4, 2)] = c_flt_m;
bf215546Sopenharmony_ci            c_flt_m_128[index_word(4, 1)] = 0;
bf215546Sopenharmony_ci            c_flt_m_128[index_word(4, 0)] = 0;
bf215546Sopenharmony_ci            _mesa_shift_right_jam_m(4, c_flt_m_128, exp_diff, c_flt_m_128);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (s == c_flt_s) {
bf215546Sopenharmony_ci        if (exp_diff <= 0) {
bf215546Sopenharmony_ci            m += c_flt_m;
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            _mesa_add_m(4, m_128, c_flt_m_128, m_128);
bf215546Sopenharmony_ci            m = (uint64_t) m_128[index_word(4, 3)] << 32
bf215546Sopenharmony_ci                | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        if (m & 0x8000000000000000) {
bf215546Sopenharmony_ci            e++;
bf215546Sopenharmony_ci            m = _mesa_short_shift_right_jam64(m, 1);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        if (exp_diff < 0) {
bf215546Sopenharmony_ci            s = c_flt_s;
bf215546Sopenharmony_ci            if (exp_diff < -1) {
bf215546Sopenharmony_ci                m = c_flt_m - m;
bf215546Sopenharmony_ci                if (m_128[index_word(4, 1)] || m_128[index_word(4, 0)]) {
bf215546Sopenharmony_ci                    m = (m - 1) | 1;
bf215546Sopenharmony_ci                }
bf215546Sopenharmony_ci                if (!(m & 0x4000000000000000)) {
bf215546Sopenharmony_ci                    --e;
bf215546Sopenharmony_ci                    m <<= 1;
bf215546Sopenharmony_ci                }
bf215546Sopenharmony_ci                return _mesa_roundtozero_f64(s, e - 1, m);
bf215546Sopenharmony_ci            } else {
bf215546Sopenharmony_ci                c_flt_m_128[index_word(4, 3)] = c_flt_m >> 32;
bf215546Sopenharmony_ci                c_flt_m_128[index_word(4, 2)] = c_flt_m;
bf215546Sopenharmony_ci                c_flt_m_128[index_word(4, 1)] = 0;
bf215546Sopenharmony_ci                c_flt_m_128[index_word(4, 0)] = 0;
bf215546Sopenharmony_ci                _mesa_sub_m(4, c_flt_m_128, m_128, m_128);
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        } else if (!exp_diff) {
bf215546Sopenharmony_ci            m -= c_flt_m;
bf215546Sopenharmony_ci            if (!m && !m_128[index_word(4, 1)] && !m_128[index_word(4, 0)]) {
bf215546Sopenharmony_ci                /* Return zero */
bf215546Sopenharmony_ci                di_type result;
bf215546Sopenharmony_ci                result.u = (s << 63) + 0;
bf215546Sopenharmony_ci                return result.f;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci            m_128[index_word(4, 3)] = m >> 32;
bf215546Sopenharmony_ci            m_128[index_word(4, 2)] = m;
bf215546Sopenharmony_ci            if (m & 0x8000000000000000) {
bf215546Sopenharmony_ci                s = !s;
bf215546Sopenharmony_ci                _mesa_neg_x_m(4, m_128);
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            _mesa_sub_m(4, m_128, c_flt_m_128, m_128);
bf215546Sopenharmony_ci            if (1 < exp_diff) {
bf215546Sopenharmony_ci                m = (uint64_t) m_128[index_word(4, 3)] << 32
bf215546Sopenharmony_ci                    | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci                if (!(m & 0x4000000000000000)) {
bf215546Sopenharmony_ci                    --e;
bf215546Sopenharmony_ci                    m <<= 1;
bf215546Sopenharmony_ci                }
bf215546Sopenharmony_ci                if (m_128[index_word(4, 1)] || m_128[index_word(4, 0)])
bf215546Sopenharmony_ci                    m |= 1;
bf215546Sopenharmony_ci                return _mesa_roundtozero_f64(s, e - 1, m);
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        shift_dist = 0;
bf215546Sopenharmony_ci        m = (uint64_t) m_128[index_word(4, 3)] << 32
bf215546Sopenharmony_ci            | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci        if (!m) {
bf215546Sopenharmony_ci            shift_dist = 64;
bf215546Sopenharmony_ci            m = (uint64_t) m_128[index_word(4, 1)] << 32
bf215546Sopenharmony_ci                | m_128[index_word(4, 0)];
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        shift_dist += _mesa_count_leading_zeros64(m) - 1;
bf215546Sopenharmony_ci        if (shift_dist) {
bf215546Sopenharmony_ci            e -= shift_dist;
bf215546Sopenharmony_ci            _mesa_shift_left_m(4, m_128, shift_dist, m_128);
bf215546Sopenharmony_ci            m = (uint64_t) m_128[index_word(4, 3)] << 32
bf215546Sopenharmony_ci                | m_128[index_word(4, 2)];
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (m_128[index_word(4, 1)] || m_128[index_word(4, 0)])
bf215546Sopenharmony_ci        m |= 1;
bf215546Sopenharmony_ci    return _mesa_roundtozero_f64(s, e - 1, m);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Calculate a * b + c but rounding to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * Notice that this mainly differs from the original Berkeley SoftFloat 3e
bf215546Sopenharmony_ci * implementation in that we don't really treat NaNs, Zeroes nor the
bf215546Sopenharmony_ci * signalling flags. Any NaN is good for us and the sign of the Zero is not
bf215546Sopenharmony_ci * important.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f32_mulAdd()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cifloat
bf215546Sopenharmony_ci_mesa_float_fma_rtz(float a, float b, float c)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const fi_type a_fi = {a};
bf215546Sopenharmony_ci    uint32_t a_flt_m = a_fi.u & 0x07fffff;
bf215546Sopenharmony_ci    uint32_t a_flt_e = (a_fi.u >> 23) & 0xff;
bf215546Sopenharmony_ci    uint32_t a_flt_s = (a_fi.u >> 31) & 0x1;
bf215546Sopenharmony_ci    const fi_type b_fi = {b};
bf215546Sopenharmony_ci    uint32_t b_flt_m = b_fi.u & 0x07fffff;
bf215546Sopenharmony_ci    uint32_t b_flt_e = (b_fi.u >> 23) & 0xff;
bf215546Sopenharmony_ci    uint32_t b_flt_s = (b_fi.u >> 31) & 0x1;
bf215546Sopenharmony_ci    const fi_type c_fi = {c};
bf215546Sopenharmony_ci    uint32_t c_flt_m = c_fi.u & 0x07fffff;
bf215546Sopenharmony_ci    uint32_t c_flt_e = (c_fi.u >> 23) & 0xff;
bf215546Sopenharmony_ci    uint32_t c_flt_s = (c_fi.u >> 31) & 0x1;
bf215546Sopenharmony_ci    int32_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    c_flt_s ^= 0;
bf215546Sopenharmony_ci    s = a_flt_s ^ b_flt_s ^ 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0xff) {
bf215546Sopenharmony_ci        if (a_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'a' is a NaN, return NaN */
bf215546Sopenharmony_ci            return a;
bf215546Sopenharmony_ci        } else if (b_flt_e == 0xff && b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        } else if (c_flt_e == 0xff && c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (!(b_flt_e | b_flt_m)) {
bf215546Sopenharmony_ci            /* Inf * 0 + y = NaN */
bf215546Sopenharmony_ci            fi_type result;
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if ((c_flt_e == 0xff && c_flt_m == 0) && (s != c_flt_s)) {
bf215546Sopenharmony_ci            /* Inf * x - Inf = NaN */
bf215546Sopenharmony_ci            fi_type result;
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* Inf * x + y = Inf */
bf215546Sopenharmony_ci        fi_type result;
bf215546Sopenharmony_ci        e = 0xff;
bf215546Sopenharmony_ci        result.u = (s << 31) + (e << 23) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (b_flt_e == 0xff) {
bf215546Sopenharmony_ci        if (b_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'b' is a NaN, return NaN */
bf215546Sopenharmony_ci            return b;
bf215546Sopenharmony_ci        } else if (c_flt_e == 0xff && c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if (!(a_flt_e | a_flt_m)) {
bf215546Sopenharmony_ci            /* 0 * Inf + y = NaN */
bf215546Sopenharmony_ci            fi_type result;
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        if ((c_flt_e == 0xff && c_flt_m == 0) && (s != c_flt_s)) {
bf215546Sopenharmony_ci            /* x * Inf - Inf = NaN */
bf215546Sopenharmony_ci            fi_type result;
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + 0x1;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* x * Inf + y = Inf */
bf215546Sopenharmony_ci        fi_type result;
bf215546Sopenharmony_ci        e = 0xff;
bf215546Sopenharmony_ci        result.u = (s << 31) + (e << 23) + 0;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (c_flt_e == 0xff) {
bf215546Sopenharmony_ci        if (c_flt_m != 0) {
bf215546Sopenharmony_ci            /* 'c' is a NaN, return NaN */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* x * y + Inf = Inf */
bf215546Sopenharmony_ci        return c;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (a_flt_e == 0) {
bf215546Sopenharmony_ci        if (a_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'a' is zero, return 'c' */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f32(a_flt_m , &a_flt_e, &a_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (b_flt_e == 0) {
bf215546Sopenharmony_ci        if (b_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'b' is zero, return 'c' */
bf215546Sopenharmony_ci            return c;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f32(b_flt_m , &b_flt_e, &b_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    e = a_flt_e + b_flt_e - 0x7e;
bf215546Sopenharmony_ci    a_flt_m = (a_flt_m | 0x00800000) << 7;
bf215546Sopenharmony_ci    b_flt_m = (b_flt_m | 0x00800000) << 7;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    uint64_t m_64 = (uint64_t) a_flt_m * b_flt_m;
bf215546Sopenharmony_ci    if (m_64 < 0x2000000000000000) {
bf215546Sopenharmony_ci        --e;
bf215546Sopenharmony_ci        m_64 <<= 1;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (c_flt_e == 0) {
bf215546Sopenharmony_ci        if (c_flt_m == 0) {
bf215546Sopenharmony_ci            /* 'c' is zero, return 'a * b' */
bf215546Sopenharmony_ci            m = _mesa_short_shift_right_jam64(m_64, 31);
bf215546Sopenharmony_ci            return _mesa_round_f32(s, e - 1, m, true);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        _mesa_norm_subnormal_mantissa_f32(c_flt_m , &c_flt_e, &c_flt_m);
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci    c_flt_m = (c_flt_m | 0x00800000) << 6;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    int16_t exp_diff = e - c_flt_e;
bf215546Sopenharmony_ci    if (s == c_flt_s) {
bf215546Sopenharmony_ci        if (exp_diff <= 0) {
bf215546Sopenharmony_ci            e = c_flt_e;
bf215546Sopenharmony_ci            m = c_flt_m + _mesa_shift_right_jam64(m_64, 32 - exp_diff);
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            m_64 += _mesa_shift_right_jam64((uint64_t) c_flt_m << 32, exp_diff);
bf215546Sopenharmony_ci            m = _mesa_short_shift_right_jam64(m_64, 32);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        if (m < 0x40000000) {
bf215546Sopenharmony_ci            --e;
bf215546Sopenharmony_ci            m <<= 1;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    } else {
bf215546Sopenharmony_ci        uint64_t c_flt_m_64 = (uint64_t) c_flt_m << 32;
bf215546Sopenharmony_ci        if (exp_diff < 0) {
bf215546Sopenharmony_ci            s = c_flt_s;
bf215546Sopenharmony_ci            e = c_flt_e;
bf215546Sopenharmony_ci            m_64 = c_flt_m_64 - _mesa_shift_right_jam64(m_64, -exp_diff);
bf215546Sopenharmony_ci        } else if (!exp_diff) {
bf215546Sopenharmony_ci            m_64 -= c_flt_m_64;
bf215546Sopenharmony_ci            if (!m_64) {
bf215546Sopenharmony_ci                /* Return zero */
bf215546Sopenharmony_ci                fi_type result;
bf215546Sopenharmony_ci                result.u = (s << 31) + 0;
bf215546Sopenharmony_ci                return result.f;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci            if (m_64 & 0x8000000000000000) {
bf215546Sopenharmony_ci                s = !s;
bf215546Sopenharmony_ci                m_64 = -m_64;
bf215546Sopenharmony_ci            }
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            m_64 -= _mesa_shift_right_jam64(c_flt_m_64, exp_diff);
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci        int8_t shift_dist = _mesa_count_leading_zeros64(m_64) - 1;
bf215546Sopenharmony_ci        e -= shift_dist;
bf215546Sopenharmony_ci        shift_dist -= 32;
bf215546Sopenharmony_ci        if (shift_dist < 0) {
bf215546Sopenharmony_ci            m = _mesa_short_shift_right_jam64(m_64, -shift_dist);
bf215546Sopenharmony_ci        } else {
bf215546Sopenharmony_ci            m = (uint32_t) m_64 << shift_dist;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_round_f32(s, e, m, true);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Converts from 64bits to 32bits float and rounds according to
bf215546Sopenharmony_ci * instructed.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f64_to_f32()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_cifloat
bf215546Sopenharmony_ci_mesa_double_to_f32(double val, bool rtz)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const di_type di = {val};
bf215546Sopenharmony_ci    uint64_t flt_m = di.u & 0x0fffffffffffff;
bf215546Sopenharmony_ci    uint64_t flt_e = (di.u >> 52) & 0x7ff;
bf215546Sopenharmony_ci    uint64_t flt_s = (di.u >> 63) & 0x1;
bf215546Sopenharmony_ci    int32_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    s = flt_s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (flt_e == 0x7ff) {
bf215546Sopenharmony_ci        if (flt_m != 0) {
bf215546Sopenharmony_ci            /* 'val' is a NaN, return NaN */
bf215546Sopenharmony_ci            fi_type result;
bf215546Sopenharmony_ci            e = 0xff;
bf215546Sopenharmony_ci            m = 0x1;
bf215546Sopenharmony_ci            result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci            return result.f;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* 'val' is Inf, return Inf */
bf215546Sopenharmony_ci        fi_type result;
bf215546Sopenharmony_ci        e = 0xff;
bf215546Sopenharmony_ci        result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (!(flt_e | flt_m)) {
bf215546Sopenharmony_ci        /* 'val' is zero, return zero */
bf215546Sopenharmony_ci        fi_type result;
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci        result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    m = _mesa_short_shift_right_jam64(flt_m, 22);
bf215546Sopenharmony_ci    if ( ! (flt_e | m) ) {
bf215546Sopenharmony_ci        /* 'val' is denorm, return zero */
bf215546Sopenharmony_ci        fi_type result;
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci        result.u = (s << 31) + (e << 23) + m;
bf215546Sopenharmony_ci        return result.f;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_round_f32(s, flt_e - 0x381, m | 0x40000000, rtz);
bf215546Sopenharmony_ci}
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci/**
bf215546Sopenharmony_ci * \brief Converts from 32bits to 16bits float and rounds the result to zero.
bf215546Sopenharmony_ci *
bf215546Sopenharmony_ci * From f32_to_f16()
bf215546Sopenharmony_ci */
bf215546Sopenharmony_ciuint16_t
bf215546Sopenharmony_ci_mesa_float_to_half_rtz_slow(float val)
bf215546Sopenharmony_ci{
bf215546Sopenharmony_ci    const fi_type fi = {val};
bf215546Sopenharmony_ci    const uint32_t flt_m = fi.u & 0x7fffff;
bf215546Sopenharmony_ci    const uint32_t flt_e = (fi.u >> 23) & 0xff;
bf215546Sopenharmony_ci    const uint32_t flt_s = (fi.u >> 31) & 0x1;
bf215546Sopenharmony_ci    int16_t s, e, m = 0;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    s = flt_s;
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (flt_e == 0xff) {
bf215546Sopenharmony_ci        if (flt_m != 0) {
bf215546Sopenharmony_ci            /* 'val' is a NaN, return NaN */
bf215546Sopenharmony_ci            e = 0x1f;
bf215546Sopenharmony_ci            /* Retain the top bits of a NaN to make sure that the quiet/signaling
bf215546Sopenharmony_ci            * status stays the same.
bf215546Sopenharmony_ci            */
bf215546Sopenharmony_ci            m = flt_m >> 13;
bf215546Sopenharmony_ci            if (!m)
bf215546Sopenharmony_ci               m = 1;
bf215546Sopenharmony_ci            return (s << 15) + (e << 10) + m;
bf215546Sopenharmony_ci        }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci        /* 'val' is Inf, return Inf */
bf215546Sopenharmony_ci        e = 0x1f;
bf215546Sopenharmony_ci        return (s << 15) + (e << 10) + m;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    if (!(flt_e | flt_m)) {
bf215546Sopenharmony_ci        /* 'val' is zero, return zero */
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci        return (s << 15) + (e << 10) + m;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    m = flt_m >> 9 | ((flt_m & 0x1ff) != 0);
bf215546Sopenharmony_ci    if ( ! (flt_e | m) ) {
bf215546Sopenharmony_ci        /* 'val' is denorm, return zero */
bf215546Sopenharmony_ci        e = 0;
bf215546Sopenharmony_ci        return (s << 15) + (e << 10) + m;
bf215546Sopenharmony_ci    }
bf215546Sopenharmony_ci
bf215546Sopenharmony_ci    return _mesa_roundtozero_f16(s, flt_e - 0x71, m | 0x4000);
bf215546Sopenharmony_ci}