src/core/SkHalf.cpp

/*
 * Copyright 2014 Google Inc.
 *
 * Use of this source code is governed by a BSD-style license that can be
 * found in the LICENSE file.
 */
cb93a386Sopenharmony_ci
#include "include/private/SkFloatBits.h"
#include "include/private/SkHalf.h"

#include <cstring>
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ciuint16_t halfMantissa(SkHalf h) {
cb93a386Sopenharmony_ci    return h & 0x03ff;
cb93a386Sopenharmony_ci}
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ciuint16_t halfExponent(SkHalf h) {
cb93a386Sopenharmony_ci    return (h >> 10) & 0x001f;
cb93a386Sopenharmony_ci}
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ciuint16_t halfSign(SkHalf h) {
cb93a386Sopenharmony_ci    return h >> 15;
cb93a386Sopenharmony_ci}
cb93a386Sopenharmony_ci
// Overlays a 32-bit unsigned integer and a float in the same storage, giving
// access to a float's raw bit pattern.
union FloatUIntUnion {
    // The integer member must stay first: brace-initialization of a union
    // (e.g. `{ 15 << 23 }`) initializes the first member, so initializers
    // written that way set the raw bits rather than a float value.
    uint32_t fUInt;
    float    fFloat;
};
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci// based on Fabien Giesen's float_to_half_fast3()
cb93a386Sopenharmony_ci// see https://gist.github.com/rygorous/2156668
cb93a386Sopenharmony_ciSkHalf SkFloatToHalf(float f) {
cb93a386Sopenharmony_ci    static const uint32_t f32infty = { 255 << 23 };
cb93a386Sopenharmony_ci    static const uint32_t f16infty = { 31 << 23 };
cb93a386Sopenharmony_ci    static const FloatUIntUnion magic = { 15 << 23 };
cb93a386Sopenharmony_ci    static const uint32_t sign_mask = 0x80000000u;
cb93a386Sopenharmony_ci    static const uint32_t round_mask = ~0xfffu;
cb93a386Sopenharmony_ci    SkHalf o = 0;
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    FloatUIntUnion floatUnion;
cb93a386Sopenharmony_ci    floatUnion.fFloat = f;
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    uint32_t sign = floatUnion.fUInt & sign_mask;
cb93a386Sopenharmony_ci    floatUnion.fUInt ^= sign;
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    // NOTE all the integer compares in this function can be safely
cb93a386Sopenharmony_ci    // compiled into signed compares since all operands are below
cb93a386Sopenharmony_ci    // 0x80000000. Important if you want fast straight SSE2 code
cb93a386Sopenharmony_ci    // (since there's no unsigned PCMPGTD).
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    // Inf or NaN (all exponent bits set)
cb93a386Sopenharmony_ci    if (floatUnion.fUInt >= f32infty)
cb93a386Sopenharmony_ci        // NaN->qNaN and Inf->Inf
cb93a386Sopenharmony_ci        o = (floatUnion.fUInt > f32infty) ? 0x7e00 : 0x7c00;
cb93a386Sopenharmony_ci    // (De)normalized number or zero
cb93a386Sopenharmony_ci    else {
cb93a386Sopenharmony_ci        floatUnion.fUInt &= round_mask;
cb93a386Sopenharmony_ci        floatUnion.fFloat *= magic.fFloat;
cb93a386Sopenharmony_ci        floatUnion.fUInt -= round_mask;
cb93a386Sopenharmony_ci        // Clamp to signed infinity if overflowed
cb93a386Sopenharmony_ci        if (floatUnion.fUInt > f16infty) {
cb93a386Sopenharmony_ci            floatUnion.fUInt = f16infty;
cb93a386Sopenharmony_ci        }
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci        o = floatUnion.fUInt >> 13; // Take the bits!
cb93a386Sopenharmony_ci    }
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    o |= sign >> 16;
cb93a386Sopenharmony_ci    return o;
cb93a386Sopenharmony_ci}
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci// based on Fabien Giesen's half_to_float_fast2()
cb93a386Sopenharmony_ci// see https://fgiesen.wordpress.com/2012/03/28/half-to-float-done-quic/
cb93a386Sopenharmony_cifloat SkHalfToFloat(SkHalf h) {
cb93a386Sopenharmony_ci    static const FloatUIntUnion magic = { 126 << 23 };
cb93a386Sopenharmony_ci    FloatUIntUnion o;
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    if (halfExponent(h) == 0)
cb93a386Sopenharmony_ci    {
cb93a386Sopenharmony_ci        // Zero / Denormal
cb93a386Sopenharmony_ci        o.fUInt = magic.fUInt + halfMantissa(h);
cb93a386Sopenharmony_ci        o.fFloat -= magic.fFloat;
cb93a386Sopenharmony_ci    }
cb93a386Sopenharmony_ci    else
cb93a386Sopenharmony_ci    {
cb93a386Sopenharmony_ci        // Set mantissa
cb93a386Sopenharmony_ci        o.fUInt = halfMantissa(h) << 13;
cb93a386Sopenharmony_ci        // Set exponent
cb93a386Sopenharmony_ci        if (halfExponent(h) == 0x1f)
cb93a386Sopenharmony_ci            // Inf/NaN
cb93a386Sopenharmony_ci            o.fUInt |= (255 << 23);
cb93a386Sopenharmony_ci        else
cb93a386Sopenharmony_ci            o.fUInt |= ((127 - 15 + halfExponent(h)) << 23);
cb93a386Sopenharmony_ci    }
cb93a386Sopenharmony_ci
cb93a386Sopenharmony_ci    // Set sign
cb93a386Sopenharmony_ci    o.fUInt |= (halfSign(h) << 31);
cb93a386Sopenharmony_ci    return o.fFloat;
cb93a386Sopenharmony_ci}