162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-or-later 262306a36Sopenharmony_ci/* 362306a36Sopenharmony_ci * Linux/PA-RISC Project (http://www.parisc-linux.org/) 462306a36Sopenharmony_ci * 562306a36Sopenharmony_ci * Floating-point emulation code 662306a36Sopenharmony_ci * Copyright (C) 2001 Hewlett-Packard (Paul Bame) <bame@debian.org> 762306a36Sopenharmony_ci */ 862306a36Sopenharmony_ci/* 962306a36Sopenharmony_ci * BEGIN_DESC 1062306a36Sopenharmony_ci * 1162306a36Sopenharmony_ci * File: 1262306a36Sopenharmony_ci * @(#) pa/spmath/sfmpy.c $Revision: 1.1 $ 1362306a36Sopenharmony_ci * 1462306a36Sopenharmony_ci * Purpose: 1562306a36Sopenharmony_ci * Single Precision Floating-point Multiply 1662306a36Sopenharmony_ci * 1762306a36Sopenharmony_ci * External Interfaces: 1862306a36Sopenharmony_ci * sgl_fmpy(srcptr1,srcptr2,dstptr,status) 1962306a36Sopenharmony_ci * 2062306a36Sopenharmony_ci * Internal Interfaces: 2162306a36Sopenharmony_ci * 2262306a36Sopenharmony_ci * Theory: 2362306a36Sopenharmony_ci * <<please update with a overview of the operation of this file>> 2462306a36Sopenharmony_ci * 2562306a36Sopenharmony_ci * END_DESC 2662306a36Sopenharmony_ci*/ 2762306a36Sopenharmony_ci 2862306a36Sopenharmony_ci 2962306a36Sopenharmony_ci#include "float.h" 3062306a36Sopenharmony_ci#include "sgl_float.h" 3162306a36Sopenharmony_ci 3262306a36Sopenharmony_ci/* 3362306a36Sopenharmony_ci * Single Precision Floating-point Multiply 3462306a36Sopenharmony_ci */ 3562306a36Sopenharmony_ci 3662306a36Sopenharmony_ciint 3762306a36Sopenharmony_cisgl_fmpy( 3862306a36Sopenharmony_ci sgl_floating_point *srcptr1, 3962306a36Sopenharmony_ci sgl_floating_point *srcptr2, 4062306a36Sopenharmony_ci sgl_floating_point *dstptr, 4162306a36Sopenharmony_ci unsigned int *status) 4262306a36Sopenharmony_ci{ 4362306a36Sopenharmony_ci register unsigned int opnd1, opnd2, opnd3, result; 4462306a36Sopenharmony_ci register int dest_exponent, count; 4562306a36Sopenharmony_ci register boolean inexact = FALSE, guardbit = FALSE, stickybit = FALSE; 4662306a36Sopenharmony_ci boolean is_tiny; 4762306a36Sopenharmony_ci 4862306a36Sopenharmony_ci opnd1 = *srcptr1; 4962306a36Sopenharmony_ci opnd2 = *srcptr2; 5062306a36Sopenharmony_ci /* 5162306a36Sopenharmony_ci * set sign bit of result 5262306a36Sopenharmony_ci */ 5362306a36Sopenharmony_ci if (Sgl_sign(opnd1) ^ Sgl_sign(opnd2)) Sgl_setnegativezero(result); 5462306a36Sopenharmony_ci else Sgl_setzero(result); 5562306a36Sopenharmony_ci /* 5662306a36Sopenharmony_ci * check first operand for NaN's or infinity 5762306a36Sopenharmony_ci */ 5862306a36Sopenharmony_ci if (Sgl_isinfinity_exponent(opnd1)) { 5962306a36Sopenharmony_ci if (Sgl_iszero_mantissa(opnd1)) { 6062306a36Sopenharmony_ci if (Sgl_isnotnan(opnd2)) { 6162306a36Sopenharmony_ci if (Sgl_iszero_exponentmantissa(opnd2)) { 6262306a36Sopenharmony_ci /* 6362306a36Sopenharmony_ci * invalid since operands are infinity 6462306a36Sopenharmony_ci * and zero 6562306a36Sopenharmony_ci */ 6662306a36Sopenharmony_ci if (Is_invalidtrap_enabled()) 6762306a36Sopenharmony_ci return(INVALIDEXCEPTION); 6862306a36Sopenharmony_ci Set_invalidflag(); 6962306a36Sopenharmony_ci Sgl_makequietnan(result); 7062306a36Sopenharmony_ci *dstptr = result; 7162306a36Sopenharmony_ci return(NOEXCEPTION); 7262306a36Sopenharmony_ci } 7362306a36Sopenharmony_ci /* 7462306a36Sopenharmony_ci * return infinity 7562306a36Sopenharmony_ci */ 7662306a36Sopenharmony_ci Sgl_setinfinity_exponentmantissa(result); 7762306a36Sopenharmony_ci *dstptr = result; 7862306a36Sopenharmony_ci return(NOEXCEPTION); 7962306a36Sopenharmony_ci } 8062306a36Sopenharmony_ci } 8162306a36Sopenharmony_ci else { 8262306a36Sopenharmony_ci /* 8362306a36Sopenharmony_ci * is NaN; signaling or quiet? 8462306a36Sopenharmony_ci */ 8562306a36Sopenharmony_ci if (Sgl_isone_signaling(opnd1)) { 8662306a36Sopenharmony_ci /* trap if INVALIDTRAP enabled */ 8762306a36Sopenharmony_ci if (Is_invalidtrap_enabled()) 8862306a36Sopenharmony_ci return(INVALIDEXCEPTION); 8962306a36Sopenharmony_ci /* make NaN quiet */ 9062306a36Sopenharmony_ci Set_invalidflag(); 9162306a36Sopenharmony_ci Sgl_set_quiet(opnd1); 9262306a36Sopenharmony_ci } 9362306a36Sopenharmony_ci /* 9462306a36Sopenharmony_ci * is second operand a signaling NaN? 9562306a36Sopenharmony_ci */ 9662306a36Sopenharmony_ci else if (Sgl_is_signalingnan(opnd2)) { 9762306a36Sopenharmony_ci /* trap if INVALIDTRAP enabled */ 9862306a36Sopenharmony_ci if (Is_invalidtrap_enabled()) 9962306a36Sopenharmony_ci return(INVALIDEXCEPTION); 10062306a36Sopenharmony_ci /* make NaN quiet */ 10162306a36Sopenharmony_ci Set_invalidflag(); 10262306a36Sopenharmony_ci Sgl_set_quiet(opnd2); 10362306a36Sopenharmony_ci *dstptr = opnd2; 10462306a36Sopenharmony_ci return(NOEXCEPTION); 10562306a36Sopenharmony_ci } 10662306a36Sopenharmony_ci /* 10762306a36Sopenharmony_ci * return quiet NaN 10862306a36Sopenharmony_ci */ 10962306a36Sopenharmony_ci *dstptr = opnd1; 11062306a36Sopenharmony_ci return(NOEXCEPTION); 11162306a36Sopenharmony_ci } 11262306a36Sopenharmony_ci } 11362306a36Sopenharmony_ci /* 11462306a36Sopenharmony_ci * check second operand for NaN's or infinity 11562306a36Sopenharmony_ci */ 11662306a36Sopenharmony_ci if (Sgl_isinfinity_exponent(opnd2)) { 11762306a36Sopenharmony_ci if (Sgl_iszero_mantissa(opnd2)) { 11862306a36Sopenharmony_ci if (Sgl_iszero_exponentmantissa(opnd1)) { 11962306a36Sopenharmony_ci /* invalid since operands are zero & infinity */ 12062306a36Sopenharmony_ci if (Is_invalidtrap_enabled()) 12162306a36Sopenharmony_ci return(INVALIDEXCEPTION); 12262306a36Sopenharmony_ci Set_invalidflag(); 12362306a36Sopenharmony_ci Sgl_makequietnan(opnd2); 12462306a36Sopenharmony_ci *dstptr = opnd2; 12562306a36Sopenharmony_ci return(NOEXCEPTION); 12662306a36Sopenharmony_ci } 12762306a36Sopenharmony_ci /* 12862306a36Sopenharmony_ci * return infinity 12962306a36Sopenharmony_ci */ 13062306a36Sopenharmony_ci Sgl_setinfinity_exponentmantissa(result); 13162306a36Sopenharmony_ci *dstptr = result; 13262306a36Sopenharmony_ci return(NOEXCEPTION); 13362306a36Sopenharmony_ci } 13462306a36Sopenharmony_ci /* 13562306a36Sopenharmony_ci * is NaN; signaling or quiet? 13662306a36Sopenharmony_ci */ 13762306a36Sopenharmony_ci if (Sgl_isone_signaling(opnd2)) { 13862306a36Sopenharmony_ci /* trap if INVALIDTRAP enabled */ 13962306a36Sopenharmony_ci if (Is_invalidtrap_enabled()) return(INVALIDEXCEPTION); 14062306a36Sopenharmony_ci 14162306a36Sopenharmony_ci /* make NaN quiet */ 14262306a36Sopenharmony_ci Set_invalidflag(); 14362306a36Sopenharmony_ci Sgl_set_quiet(opnd2); 14462306a36Sopenharmony_ci } 14562306a36Sopenharmony_ci /* 14662306a36Sopenharmony_ci * return quiet NaN 14762306a36Sopenharmony_ci */ 14862306a36Sopenharmony_ci *dstptr = opnd2; 14962306a36Sopenharmony_ci return(NOEXCEPTION); 15062306a36Sopenharmony_ci } 15162306a36Sopenharmony_ci /* 15262306a36Sopenharmony_ci * Generate exponent 15362306a36Sopenharmony_ci */ 15462306a36Sopenharmony_ci dest_exponent = Sgl_exponent(opnd1) + Sgl_exponent(opnd2) - SGL_BIAS; 15562306a36Sopenharmony_ci 15662306a36Sopenharmony_ci /* 15762306a36Sopenharmony_ci * Generate mantissa 15862306a36Sopenharmony_ci */ 15962306a36Sopenharmony_ci if (Sgl_isnotzero_exponent(opnd1)) { 16062306a36Sopenharmony_ci /* set hidden bit */ 16162306a36Sopenharmony_ci Sgl_clear_signexponent_set_hidden(opnd1); 16262306a36Sopenharmony_ci } 16362306a36Sopenharmony_ci else { 16462306a36Sopenharmony_ci /* check for zero */ 16562306a36Sopenharmony_ci if (Sgl_iszero_mantissa(opnd1)) { 16662306a36Sopenharmony_ci Sgl_setzero_exponentmantissa(result); 16762306a36Sopenharmony_ci *dstptr = result; 16862306a36Sopenharmony_ci return(NOEXCEPTION); 16962306a36Sopenharmony_ci } 17062306a36Sopenharmony_ci /* is denormalized, adjust exponent */ 17162306a36Sopenharmony_ci Sgl_clear_signexponent(opnd1); 17262306a36Sopenharmony_ci Sgl_leftshiftby1(opnd1); 17362306a36Sopenharmony_ci Sgl_normalize(opnd1,dest_exponent); 17462306a36Sopenharmony_ci } 17562306a36Sopenharmony_ci /* opnd2 needs to have hidden bit set with msb in hidden bit */ 17662306a36Sopenharmony_ci if (Sgl_isnotzero_exponent(opnd2)) { 17762306a36Sopenharmony_ci Sgl_clear_signexponent_set_hidden(opnd2); 17862306a36Sopenharmony_ci } 17962306a36Sopenharmony_ci else { 18062306a36Sopenharmony_ci /* check for zero */ 18162306a36Sopenharmony_ci if (Sgl_iszero_mantissa(opnd2)) { 18262306a36Sopenharmony_ci Sgl_setzero_exponentmantissa(result); 18362306a36Sopenharmony_ci *dstptr = result; 18462306a36Sopenharmony_ci return(NOEXCEPTION); 18562306a36Sopenharmony_ci } 18662306a36Sopenharmony_ci /* is denormalized; want to normalize */ 18762306a36Sopenharmony_ci Sgl_clear_signexponent(opnd2); 18862306a36Sopenharmony_ci Sgl_leftshiftby1(opnd2); 18962306a36Sopenharmony_ci Sgl_normalize(opnd2,dest_exponent); 19062306a36Sopenharmony_ci } 19162306a36Sopenharmony_ci 19262306a36Sopenharmony_ci /* Multiply two source mantissas together */ 19362306a36Sopenharmony_ci 19462306a36Sopenharmony_ci Sgl_leftshiftby4(opnd2); /* make room for guard bits */ 19562306a36Sopenharmony_ci Sgl_setzero(opnd3); 19662306a36Sopenharmony_ci /* 19762306a36Sopenharmony_ci * Four bits at a time are inspected in each loop, and a 19862306a36Sopenharmony_ci * simple shift and add multiply algorithm is used. 19962306a36Sopenharmony_ci */ 20062306a36Sopenharmony_ci for (count=1;count<SGL_P;count+=4) { 20162306a36Sopenharmony_ci stickybit |= Slow4(opnd3); 20262306a36Sopenharmony_ci Sgl_rightshiftby4(opnd3); 20362306a36Sopenharmony_ci if (Sbit28(opnd1)) Sall(opnd3) += (Sall(opnd2) << 3); 20462306a36Sopenharmony_ci if (Sbit29(opnd1)) Sall(opnd3) += (Sall(opnd2) << 2); 20562306a36Sopenharmony_ci if (Sbit30(opnd1)) Sall(opnd3) += (Sall(opnd2) << 1); 20662306a36Sopenharmony_ci if (Sbit31(opnd1)) Sall(opnd3) += Sall(opnd2); 20762306a36Sopenharmony_ci Sgl_rightshiftby4(opnd1); 20862306a36Sopenharmony_ci } 20962306a36Sopenharmony_ci /* make sure result is left-justified */ 21062306a36Sopenharmony_ci if (Sgl_iszero_sign(opnd3)) { 21162306a36Sopenharmony_ci Sgl_leftshiftby1(opnd3); 21262306a36Sopenharmony_ci } 21362306a36Sopenharmony_ci else { 21462306a36Sopenharmony_ci /* result mantissa >= 2. */ 21562306a36Sopenharmony_ci dest_exponent++; 21662306a36Sopenharmony_ci } 21762306a36Sopenharmony_ci /* check for denormalized result */ 21862306a36Sopenharmony_ci while (Sgl_iszero_sign(opnd3)) { 21962306a36Sopenharmony_ci Sgl_leftshiftby1(opnd3); 22062306a36Sopenharmony_ci dest_exponent--; 22162306a36Sopenharmony_ci } 22262306a36Sopenharmony_ci /* 22362306a36Sopenharmony_ci * check for guard, sticky and inexact bits 22462306a36Sopenharmony_ci */ 22562306a36Sopenharmony_ci stickybit |= Sgl_all(opnd3) << (SGL_BITLENGTH - SGL_EXP_LENGTH + 1); 22662306a36Sopenharmony_ci guardbit = Sbit24(opnd3); 22762306a36Sopenharmony_ci inexact = guardbit | stickybit; 22862306a36Sopenharmony_ci 22962306a36Sopenharmony_ci /* re-align mantissa */ 23062306a36Sopenharmony_ci Sgl_rightshiftby8(opnd3); 23162306a36Sopenharmony_ci 23262306a36Sopenharmony_ci /* 23362306a36Sopenharmony_ci * round result 23462306a36Sopenharmony_ci */ 23562306a36Sopenharmony_ci if (inexact && (dest_exponent>0 || Is_underflowtrap_enabled())) { 23662306a36Sopenharmony_ci Sgl_clear_signexponent(opnd3); 23762306a36Sopenharmony_ci switch (Rounding_mode()) { 23862306a36Sopenharmony_ci case ROUNDPLUS: 23962306a36Sopenharmony_ci if (Sgl_iszero_sign(result)) 24062306a36Sopenharmony_ci Sgl_increment(opnd3); 24162306a36Sopenharmony_ci break; 24262306a36Sopenharmony_ci case ROUNDMINUS: 24362306a36Sopenharmony_ci if (Sgl_isone_sign(result)) 24462306a36Sopenharmony_ci Sgl_increment(opnd3); 24562306a36Sopenharmony_ci break; 24662306a36Sopenharmony_ci case ROUNDNEAREST: 24762306a36Sopenharmony_ci if (guardbit) { 24862306a36Sopenharmony_ci if (stickybit || Sgl_isone_lowmantissa(opnd3)) 24962306a36Sopenharmony_ci Sgl_increment(opnd3); 25062306a36Sopenharmony_ci } 25162306a36Sopenharmony_ci } 25262306a36Sopenharmony_ci if (Sgl_isone_hidden(opnd3)) dest_exponent++; 25362306a36Sopenharmony_ci } 25462306a36Sopenharmony_ci Sgl_set_mantissa(result,opnd3); 25562306a36Sopenharmony_ci 25662306a36Sopenharmony_ci /* 25762306a36Sopenharmony_ci * Test for overflow 25862306a36Sopenharmony_ci */ 25962306a36Sopenharmony_ci if (dest_exponent >= SGL_INFINITY_EXPONENT) { 26062306a36Sopenharmony_ci /* trap if OVERFLOWTRAP enabled */ 26162306a36Sopenharmony_ci if (Is_overflowtrap_enabled()) { 26262306a36Sopenharmony_ci /* 26362306a36Sopenharmony_ci * Adjust bias of result 26462306a36Sopenharmony_ci */ 26562306a36Sopenharmony_ci Sgl_setwrapped_exponent(result,dest_exponent,ovfl); 26662306a36Sopenharmony_ci *dstptr = result; 26762306a36Sopenharmony_ci if (inexact) 26862306a36Sopenharmony_ci if (Is_inexacttrap_enabled()) 26962306a36Sopenharmony_ci return(OVERFLOWEXCEPTION | INEXACTEXCEPTION); 27062306a36Sopenharmony_ci else Set_inexactflag(); 27162306a36Sopenharmony_ci return(OVERFLOWEXCEPTION); 27262306a36Sopenharmony_ci } 27362306a36Sopenharmony_ci inexact = TRUE; 27462306a36Sopenharmony_ci Set_overflowflag(); 27562306a36Sopenharmony_ci /* set result to infinity or largest number */ 27662306a36Sopenharmony_ci Sgl_setoverflow(result); 27762306a36Sopenharmony_ci } 27862306a36Sopenharmony_ci /* 27962306a36Sopenharmony_ci * Test for underflow 28062306a36Sopenharmony_ci */ 28162306a36Sopenharmony_ci else if (dest_exponent <= 0) { 28262306a36Sopenharmony_ci /* trap if UNDERFLOWTRAP enabled */ 28362306a36Sopenharmony_ci if (Is_underflowtrap_enabled()) { 28462306a36Sopenharmony_ci /* 28562306a36Sopenharmony_ci * Adjust bias of result 28662306a36Sopenharmony_ci */ 28762306a36Sopenharmony_ci Sgl_setwrapped_exponent(result,dest_exponent,unfl); 28862306a36Sopenharmony_ci *dstptr = result; 28962306a36Sopenharmony_ci if (inexact) 29062306a36Sopenharmony_ci if (Is_inexacttrap_enabled()) 29162306a36Sopenharmony_ci return(UNDERFLOWEXCEPTION | INEXACTEXCEPTION); 29262306a36Sopenharmony_ci else Set_inexactflag(); 29362306a36Sopenharmony_ci return(UNDERFLOWEXCEPTION); 29462306a36Sopenharmony_ci } 29562306a36Sopenharmony_ci 29662306a36Sopenharmony_ci /* Determine if should set underflow flag */ 29762306a36Sopenharmony_ci is_tiny = TRUE; 29862306a36Sopenharmony_ci if (dest_exponent == 0 && inexact) { 29962306a36Sopenharmony_ci switch (Rounding_mode()) { 30062306a36Sopenharmony_ci case ROUNDPLUS: 30162306a36Sopenharmony_ci if (Sgl_iszero_sign(result)) { 30262306a36Sopenharmony_ci Sgl_increment(opnd3); 30362306a36Sopenharmony_ci if (Sgl_isone_hiddenoverflow(opnd3)) 30462306a36Sopenharmony_ci is_tiny = FALSE; 30562306a36Sopenharmony_ci Sgl_decrement(opnd3); 30662306a36Sopenharmony_ci } 30762306a36Sopenharmony_ci break; 30862306a36Sopenharmony_ci case ROUNDMINUS: 30962306a36Sopenharmony_ci if (Sgl_isone_sign(result)) { 31062306a36Sopenharmony_ci Sgl_increment(opnd3); 31162306a36Sopenharmony_ci if (Sgl_isone_hiddenoverflow(opnd3)) 31262306a36Sopenharmony_ci is_tiny = FALSE; 31362306a36Sopenharmony_ci Sgl_decrement(opnd3); 31462306a36Sopenharmony_ci } 31562306a36Sopenharmony_ci break; 31662306a36Sopenharmony_ci case ROUNDNEAREST: 31762306a36Sopenharmony_ci if (guardbit && (stickybit || 31862306a36Sopenharmony_ci Sgl_isone_lowmantissa(opnd3))) { 31962306a36Sopenharmony_ci Sgl_increment(opnd3); 32062306a36Sopenharmony_ci if (Sgl_isone_hiddenoverflow(opnd3)) 32162306a36Sopenharmony_ci is_tiny = FALSE; 32262306a36Sopenharmony_ci Sgl_decrement(opnd3); 32362306a36Sopenharmony_ci } 32462306a36Sopenharmony_ci break; 32562306a36Sopenharmony_ci } 32662306a36Sopenharmony_ci } 32762306a36Sopenharmony_ci 32862306a36Sopenharmony_ci /* 32962306a36Sopenharmony_ci * denormalize result or set to signed zero 33062306a36Sopenharmony_ci */ 33162306a36Sopenharmony_ci stickybit = inexact; 33262306a36Sopenharmony_ci Sgl_denormalize(opnd3,dest_exponent,guardbit,stickybit,inexact); 33362306a36Sopenharmony_ci 33462306a36Sopenharmony_ci /* return zero or smallest number */ 33562306a36Sopenharmony_ci if (inexact) { 33662306a36Sopenharmony_ci switch (Rounding_mode()) { 33762306a36Sopenharmony_ci case ROUNDPLUS: 33862306a36Sopenharmony_ci if (Sgl_iszero_sign(result)) { 33962306a36Sopenharmony_ci Sgl_increment(opnd3); 34062306a36Sopenharmony_ci } 34162306a36Sopenharmony_ci break; 34262306a36Sopenharmony_ci case ROUNDMINUS: 34362306a36Sopenharmony_ci if (Sgl_isone_sign(result)) { 34462306a36Sopenharmony_ci Sgl_increment(opnd3); 34562306a36Sopenharmony_ci } 34662306a36Sopenharmony_ci break; 34762306a36Sopenharmony_ci case ROUNDNEAREST: 34862306a36Sopenharmony_ci if (guardbit && (stickybit || 34962306a36Sopenharmony_ci Sgl_isone_lowmantissa(opnd3))) { 35062306a36Sopenharmony_ci Sgl_increment(opnd3); 35162306a36Sopenharmony_ci } 35262306a36Sopenharmony_ci break; 35362306a36Sopenharmony_ci } 35462306a36Sopenharmony_ci if (is_tiny) Set_underflowflag(); 35562306a36Sopenharmony_ci } 35662306a36Sopenharmony_ci Sgl_set_exponentmantissa(result,opnd3); 35762306a36Sopenharmony_ci } 35862306a36Sopenharmony_ci else Sgl_set_exponent(result,dest_exponent); 35962306a36Sopenharmony_ci *dstptr = result; 36062306a36Sopenharmony_ci 36162306a36Sopenharmony_ci /* check for inexact */ 36262306a36Sopenharmony_ci if (inexact) { 36362306a36Sopenharmony_ci if (Is_inexacttrap_enabled()) return(INEXACTEXCEPTION); 36462306a36Sopenharmony_ci else Set_inexactflag(); 36562306a36Sopenharmony_ci } 36662306a36Sopenharmony_ci return(NOEXCEPTION); 36762306a36Sopenharmony_ci} 368