1cb93a386Sopenharmony_ci/* 2cb93a386Sopenharmony_ci * Copyright 2015 Google Inc. 3cb93a386Sopenharmony_ci * 4cb93a386Sopenharmony_ci * Use of this source code is governed by a BSD-style license that can be 5cb93a386Sopenharmony_ci * found in the LICENSE file. 6cb93a386Sopenharmony_ci */ 7cb93a386Sopenharmony_ci 8cb93a386Sopenharmony_ci#include "include/private/SkNx.h" 9cb93a386Sopenharmony_ci#include "include/utils/SkRandom.h" 10cb93a386Sopenharmony_ci#include "src/core/Sk4px.h" 11cb93a386Sopenharmony_ci#include "tests/Test.h" 12cb93a386Sopenharmony_ci 13cb93a386Sopenharmony_citemplate <int N> 14cb93a386Sopenharmony_cistatic void test_Nf(skiatest::Reporter* r) { 15cb93a386Sopenharmony_ci 16cb93a386Sopenharmony_ci auto assert_nearly_eq = [&](float eps, const SkNx<N, float>& v, 17cb93a386Sopenharmony_ci float a, float b, float c, float d) { 18cb93a386Sopenharmony_ci auto close = [=](float a, float b) { return fabsf(a-b) <= eps; }; 19cb93a386Sopenharmony_ci float vals[4]; 20cb93a386Sopenharmony_ci v.store(vals); 21cb93a386Sopenharmony_ci bool ok = close(vals[0], a) && close(vals[1], b) 22cb93a386Sopenharmony_ci && close( v[0], a) && close( v[1], b); 23cb93a386Sopenharmony_ci REPORTER_ASSERT(r, ok); 24cb93a386Sopenharmony_ci if (N == 4) { 25cb93a386Sopenharmony_ci ok = close(vals[2], c) && close(vals[3], d) 26cb93a386Sopenharmony_ci && close( v[2], c) && close( v[3], d); 27cb93a386Sopenharmony_ci REPORTER_ASSERT(r, ok); 28cb93a386Sopenharmony_ci } 29cb93a386Sopenharmony_ci }; 30cb93a386Sopenharmony_ci auto assert_eq = [&](const SkNx<N, float>& v, float a, float b, float c, float d) { 31cb93a386Sopenharmony_ci return assert_nearly_eq(0, v, a,b,c,d); 32cb93a386Sopenharmony_ci }; 33cb93a386Sopenharmony_ci 34cb93a386Sopenharmony_ci float vals[] = {3, 4, 5, 6}; 35cb93a386Sopenharmony_ci SkNx<N,float> a = SkNx<N,float>::Load(vals), 36cb93a386Sopenharmony_ci b(a), 37cb93a386Sopenharmony_ci c = a; 38cb93a386Sopenharmony_ci SkNx<N,float> d; 39cb93a386Sopenharmony_ci d = a; 40cb93a386Sopenharmony_ci 41cb93a386Sopenharmony_ci assert_eq(a, 3, 4, 5, 6); 42cb93a386Sopenharmony_ci assert_eq(b, 3, 4, 5, 6); 43cb93a386Sopenharmony_ci assert_eq(c, 3, 4, 5, 6); 44cb93a386Sopenharmony_ci assert_eq(d, 3, 4, 5, 6); 45cb93a386Sopenharmony_ci 46cb93a386Sopenharmony_ci assert_eq(a+b, 6, 8, 10, 12); 47cb93a386Sopenharmony_ci assert_eq(a*b, 9, 16, 25, 36); 48cb93a386Sopenharmony_ci assert_eq(a*b-b, 6, 12, 20, 30); 49cb93a386Sopenharmony_ci assert_eq((a*b).sqrt(), 3, 4, 5, 6); 50cb93a386Sopenharmony_ci assert_eq(a/b, 1, 1, 1, 1); 51cb93a386Sopenharmony_ci assert_eq(SkNx<N,float>(0)-a, -3, -4, -5, -6); 52cb93a386Sopenharmony_ci 53cb93a386Sopenharmony_ci SkNx<N,float> fours(4); 54cb93a386Sopenharmony_ci 55cb93a386Sopenharmony_ci assert_eq(fours.sqrt(), 2,2,2,2); 56cb93a386Sopenharmony_ci 57cb93a386Sopenharmony_ci assert_eq(SkNx<N,float>::Min(a, fours), 3, 4, 4, 4); 58cb93a386Sopenharmony_ci assert_eq(SkNx<N,float>::Max(a, fours), 4, 4, 5, 6); 59cb93a386Sopenharmony_ci 60cb93a386Sopenharmony_ci // Test some comparisons. This is not exhaustive. 61cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (a == b).allTrue()); 62cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (a+b == a*b-b).anyTrue()); 63cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(a+b == a*b-b).allTrue()); 64cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(a+b == a*b).anyTrue()); 65cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(a != b).anyTrue()); 66cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (a < fours).anyTrue()); 67cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (a <= fours).anyTrue()); 68cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(a > fours).allTrue()); 69cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(a >= fours).allTrue()); 70cb93a386Sopenharmony_ci} 71cb93a386Sopenharmony_ci 72cb93a386Sopenharmony_ciDEF_TEST(SkNf, r) { 73cb93a386Sopenharmony_ci test_Nf<2>(r); 74cb93a386Sopenharmony_ci test_Nf<4>(r); 75cb93a386Sopenharmony_ci} 76cb93a386Sopenharmony_ci 77cb93a386Sopenharmony_citemplate <int N, typename T> 78cb93a386Sopenharmony_civoid test_Ni(skiatest::Reporter* r) { 79cb93a386Sopenharmony_ci auto assert_eq = [&](const SkNx<N,T>& v, T a, T b, T c, T d, T e, T f, T g, T h) { 80cb93a386Sopenharmony_ci T vals[8]; 81cb93a386Sopenharmony_ci v.store(vals); 82cb93a386Sopenharmony_ci 83cb93a386Sopenharmony_ci switch (N) { 84cb93a386Sopenharmony_ci case 8: 85cb93a386Sopenharmony_ci REPORTER_ASSERT(r, vals[4] == e && vals[5] == f && vals[6] == g && vals[7] == h); 86cb93a386Sopenharmony_ci [[fallthrough]]; 87cb93a386Sopenharmony_ci case 4: 88cb93a386Sopenharmony_ci REPORTER_ASSERT(r, vals[2] == c && vals[3] == d); 89cb93a386Sopenharmony_ci [[fallthrough]]; 90cb93a386Sopenharmony_ci case 2: 91cb93a386Sopenharmony_ci REPORTER_ASSERT(r, vals[0] == a && vals[1] == b); 92cb93a386Sopenharmony_ci } 93cb93a386Sopenharmony_ci switch (N) { 94cb93a386Sopenharmony_ci case 8: 95cb93a386Sopenharmony_ci REPORTER_ASSERT(r, v[4] == e && v[5] == f && v[6] == g && v[7] == h); 96cb93a386Sopenharmony_ci [[fallthrough]]; 97cb93a386Sopenharmony_ci case 4: 98cb93a386Sopenharmony_ci REPORTER_ASSERT(r, v[2] == c && v[3] == d); 99cb93a386Sopenharmony_ci [[fallthrough]]; 100cb93a386Sopenharmony_ci case 2: 101cb93a386Sopenharmony_ci REPORTER_ASSERT(r, v[0] == a && v[1] == b); 102cb93a386Sopenharmony_ci } 103cb93a386Sopenharmony_ci }; 104cb93a386Sopenharmony_ci 105cb93a386Sopenharmony_ci T vals[] = { 1,2,3,4,5,6,7,8 }; 106cb93a386Sopenharmony_ci SkNx<N,T> a = SkNx<N,T>::Load(vals), 107cb93a386Sopenharmony_ci b(a), 108cb93a386Sopenharmony_ci c = a; 109cb93a386Sopenharmony_ci SkNx<N,T> d; 110cb93a386Sopenharmony_ci d = a; 111cb93a386Sopenharmony_ci 112cb93a386Sopenharmony_ci assert_eq(a, 1,2,3,4,5,6,7,8); 113cb93a386Sopenharmony_ci assert_eq(b, 1,2,3,4,5,6,7,8); 114cb93a386Sopenharmony_ci assert_eq(c, 1,2,3,4,5,6,7,8); 115cb93a386Sopenharmony_ci assert_eq(d, 1,2,3,4,5,6,7,8); 116cb93a386Sopenharmony_ci 117cb93a386Sopenharmony_ci assert_eq(a+a, 2,4,6,8,10,12,14,16); 118cb93a386Sopenharmony_ci assert_eq(a*a, 1,4,9,16,25,36,49,64); 119cb93a386Sopenharmony_ci assert_eq(a*a-a, 0,2,6,12,20,30,42,56); 120cb93a386Sopenharmony_ci 121cb93a386Sopenharmony_ci assert_eq(a >> 2, 0,0,0,1,1,1,1,2); 122cb93a386Sopenharmony_ci assert_eq(a << 1, 2,4,6,8,10,12,14,16); 123cb93a386Sopenharmony_ci 124cb93a386Sopenharmony_ci REPORTER_ASSERT(r, a[1] == 2); 125cb93a386Sopenharmony_ci} 126cb93a386Sopenharmony_ci 127cb93a386Sopenharmony_ciDEF_TEST(SkNx, r) { 128cb93a386Sopenharmony_ci test_Ni<2, uint16_t>(r); 129cb93a386Sopenharmony_ci test_Ni<4, uint16_t>(r); 130cb93a386Sopenharmony_ci test_Ni<8, uint16_t>(r); 131cb93a386Sopenharmony_ci 132cb93a386Sopenharmony_ci test_Ni<2, int>(r); 133cb93a386Sopenharmony_ci test_Ni<4, int>(r); 134cb93a386Sopenharmony_ci test_Ni<8, int>(r); 135cb93a386Sopenharmony_ci} 136cb93a386Sopenharmony_ci 137cb93a386Sopenharmony_ciDEF_TEST(SkNi_min_lt, r) { 138cb93a386Sopenharmony_ci // Exhaustively check the 8x8 bit space. 139cb93a386Sopenharmony_ci for (int a = 0; a < (1<<8); a++) { 140cb93a386Sopenharmony_ci for (int b = 0; b < (1<<8); b++) { 141cb93a386Sopenharmony_ci Sk16b aw(a), bw(b); 142cb93a386Sopenharmony_ci REPORTER_ASSERT(r, Sk16b::Min(aw, bw)[0] == std::min(a, b)); 143cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(aw < bw)[0] == !(a < b)); 144cb93a386Sopenharmony_ci }} 145cb93a386Sopenharmony_ci 146cb93a386Sopenharmony_ci // Exhausting the 16x16 bit space is kind of slow, so only do that in release builds. 147cb93a386Sopenharmony_ci#ifdef SK_DEBUG 148cb93a386Sopenharmony_ci SkRandom rand; 149cb93a386Sopenharmony_ci for (int i = 0; i < (1<<16); i++) { 150cb93a386Sopenharmony_ci uint16_t a = rand.nextU() >> 16, 151cb93a386Sopenharmony_ci b = rand.nextU() >> 16; 152cb93a386Sopenharmony_ci REPORTER_ASSERT(r, Sk16h::Min(Sk16h(a), Sk16h(b))[0] == std::min(a, b)); 153cb93a386Sopenharmony_ci } 154cb93a386Sopenharmony_ci#else 155cb93a386Sopenharmony_ci for (int a = 0; a < (1<<16); a++) { 156cb93a386Sopenharmony_ci for (int b = 0; b < (1<<16); b++) { 157cb93a386Sopenharmony_ci REPORTER_ASSERT(r, Sk16h::Min(Sk16h(a), Sk16h(b))[0] == std::min(a, b)); 158cb93a386Sopenharmony_ci }} 159cb93a386Sopenharmony_ci#endif 160cb93a386Sopenharmony_ci} 161cb93a386Sopenharmony_ci 162cb93a386Sopenharmony_ciDEF_TEST(SkNi_saturatedAdd, r) { 163cb93a386Sopenharmony_ci for (int a = 0; a < (1<<8); a++) { 164cb93a386Sopenharmony_ci for (int b = 0; b < (1<<8); b++) { 165cb93a386Sopenharmony_ci int exact = a+b; 166cb93a386Sopenharmony_ci if (exact > 255) { exact = 255; } 167cb93a386Sopenharmony_ci if (exact < 0) { exact = 0; } 168cb93a386Sopenharmony_ci 169cb93a386Sopenharmony_ci REPORTER_ASSERT(r, Sk16b(a).saturatedAdd(Sk16b(b))[0] == exact); 170cb93a386Sopenharmony_ci } 171cb93a386Sopenharmony_ci } 172cb93a386Sopenharmony_ci} 173cb93a386Sopenharmony_ci 174cb93a386Sopenharmony_ciDEF_TEST(SkNi_mulHi, r) { 175cb93a386Sopenharmony_ci // First 8 primes. 176cb93a386Sopenharmony_ci Sk4u a{ 0x00020000, 0x00030000, 0x00050000, 0x00070000 }; 177cb93a386Sopenharmony_ci Sk4u b{ 0x000b0000, 0x000d0000, 0x00110000, 0x00130000 }; 178cb93a386Sopenharmony_ci 179cb93a386Sopenharmony_ci Sk4u q{22, 39, 85, 133}; 180cb93a386Sopenharmony_ci 181cb93a386Sopenharmony_ci Sk4u c = a.mulHi(b); 182cb93a386Sopenharmony_ci REPORTER_ASSERT(r, c[0] == q[0]); 183cb93a386Sopenharmony_ci REPORTER_ASSERT(r, c[1] == q[1]); 184cb93a386Sopenharmony_ci REPORTER_ASSERT(r, c[2] == q[2]); 185cb93a386Sopenharmony_ci REPORTER_ASSERT(r, c[3] == q[3]); 186cb93a386Sopenharmony_ci} 187cb93a386Sopenharmony_ci 188cb93a386Sopenharmony_ciDEF_TEST(Sk4px_muldiv255round, r) { 189cb93a386Sopenharmony_ci for (int a = 0; a < (1<<8); a++) { 190cb93a386Sopenharmony_ci for (int b = 0; b < (1<<8); b++) { 191cb93a386Sopenharmony_ci int exact = (a*b+127)/255; 192cb93a386Sopenharmony_ci 193cb93a386Sopenharmony_ci // Duplicate a and b 16x each. 194cb93a386Sopenharmony_ci Sk4px av = Sk16b(a), 195cb93a386Sopenharmony_ci bv = Sk16b(b); 196cb93a386Sopenharmony_ci 197cb93a386Sopenharmony_ci // This way should always be exactly correct. 198cb93a386Sopenharmony_ci int correct = (av * bv).div255()[0]; 199cb93a386Sopenharmony_ci REPORTER_ASSERT(r, correct == exact); 200cb93a386Sopenharmony_ci 201cb93a386Sopenharmony_ci // We're a bit more flexible on this method: correct for 0 or 255, otherwise off by <=1. 202cb93a386Sopenharmony_ci int fast = av.approxMulDiv255(bv)[0]; 203cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fast-exact >= -1 && fast-exact <= 1); 204cb93a386Sopenharmony_ci if (a == 0 || a == 255 || b == 0 || b == 255) { 205cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fast == exact); 206cb93a386Sopenharmony_ci } 207cb93a386Sopenharmony_ci } 208cb93a386Sopenharmony_ci } 209cb93a386Sopenharmony_ci} 210cb93a386Sopenharmony_ci 211cb93a386Sopenharmony_ciDEF_TEST(SkNx_abs, r) { 212cb93a386Sopenharmony_ci auto fs = Sk4f(0.0f, -0.0f, 2.0f, -4.0f).abs(); 213cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[0] == 0.0f); 214cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[1] == 0.0f); 215cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[2] == 2.0f); 216cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[3] == 4.0f); 217cb93a386Sopenharmony_ci auto fshi = Sk2f(0.0f, -0.0f).abs(); 218cb93a386Sopenharmony_ci auto fslo = Sk2f(2.0f, -4.0f).abs(); 219cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[0] == 0.0f); 220cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[1] == 0.0f); 221cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[0] == 2.0f); 222cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[1] == 4.0f); 223cb93a386Sopenharmony_ci} 224cb93a386Sopenharmony_ci 225cb93a386Sopenharmony_ciDEF_TEST(Sk4i_abs, r) { 226cb93a386Sopenharmony_ci auto is = Sk4i(0, -1, 2, -2147483647).abs(); 227cb93a386Sopenharmony_ci REPORTER_ASSERT(r, is[0] == 0); 228cb93a386Sopenharmony_ci REPORTER_ASSERT(r, is[1] == 1); 229cb93a386Sopenharmony_ci REPORTER_ASSERT(r, is[2] == 2); 230cb93a386Sopenharmony_ci REPORTER_ASSERT(r, is[3] == 2147483647); 231cb93a386Sopenharmony_ci} 232cb93a386Sopenharmony_ci 233cb93a386Sopenharmony_ciDEF_TEST(Sk4i_minmax, r) { 234cb93a386Sopenharmony_ci auto a = Sk4i(0, 2, 4, 6); 235cb93a386Sopenharmony_ci auto b = Sk4i(1, 1, 3, 7); 236cb93a386Sopenharmony_ci auto min = Sk4i::Min(a, b); 237cb93a386Sopenharmony_ci auto max = Sk4i::Max(a, b); 238cb93a386Sopenharmony_ci for(int i = 0; i < 4; ++i) { 239cb93a386Sopenharmony_ci REPORTER_ASSERT(r, min[i] == std::min(a[i], b[i])); 240cb93a386Sopenharmony_ci REPORTER_ASSERT(r, max[i] == std::max(a[i], b[i])); 241cb93a386Sopenharmony_ci } 242cb93a386Sopenharmony_ci} 243cb93a386Sopenharmony_ci 244cb93a386Sopenharmony_ciDEF_TEST(SkNx_floor, r) { 245cb93a386Sopenharmony_ci auto fs = Sk4f(0.4f, -0.4f, 0.6f, -0.6f).floor(); 246cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[0] == 0.0f); 247cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[1] == -1.0f); 248cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[2] == 0.0f); 249cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[3] == -1.0f); 250cb93a386Sopenharmony_ci 251cb93a386Sopenharmony_ci auto fs2 = Sk2f(0.4f, -0.4f).floor(); 252cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs2[0] == 0.0f); 253cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs2[1] == -1.0f); 254cb93a386Sopenharmony_ci 255cb93a386Sopenharmony_ci auto fs3 = Sk2f(0.6f, -0.6f).floor(); 256cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs3[0] == 0.0f); 257cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs3[1] == -1.0f); 258cb93a386Sopenharmony_ci} 259cb93a386Sopenharmony_ci 260cb93a386Sopenharmony_ciDEF_TEST(SkNx_shuffle, r) { 261cb93a386Sopenharmony_ci Sk4f f4(0,10,20,30); 262cb93a386Sopenharmony_ci 263cb93a386Sopenharmony_ci Sk2f f2 = SkNx_shuffle<2,1>(f4); 264cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f2[0] == 20); 265cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f2[1] == 10); 266cb93a386Sopenharmony_ci 267cb93a386Sopenharmony_ci f4 = SkNx_shuffle<0,1,1,0>(f2); 268cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[0] == 20); 269cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[1] == 10); 270cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[2] == 10); 271cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[3] == 20); 272cb93a386Sopenharmony_ci} 273cb93a386Sopenharmony_ci 274cb93a386Sopenharmony_ciDEF_TEST(SkNx_int_float, r) { 275cb93a386Sopenharmony_ci Sk4f f(-2.3f, 1.0f, 0.45f, 0.6f); 276cb93a386Sopenharmony_ci 277cb93a386Sopenharmony_ci Sk4i i = SkNx_cast<int>(f); 278cb93a386Sopenharmony_ci REPORTER_ASSERT(r, i[0] == -2); 279cb93a386Sopenharmony_ci REPORTER_ASSERT(r, i[1] == 1); 280cb93a386Sopenharmony_ci REPORTER_ASSERT(r, i[2] == 0); 281cb93a386Sopenharmony_ci REPORTER_ASSERT(r, i[3] == 0); 282cb93a386Sopenharmony_ci 283cb93a386Sopenharmony_ci f = SkNx_cast<float>(i); 284cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f[0] == -2.0f); 285cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f[1] == 1.0f); 286cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f[2] == 0.0f); 287cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f[3] == 0.0f); 288cb93a386Sopenharmony_ci} 289cb93a386Sopenharmony_ci 290cb93a386Sopenharmony_ci#include "include/utils/SkRandom.h" 291cb93a386Sopenharmony_ci 292cb93a386Sopenharmony_ciDEF_TEST(SkNx_u16_float, r) { 293cb93a386Sopenharmony_ci { 294cb93a386Sopenharmony_ci // u16 --> float 295cb93a386Sopenharmony_ci auto h4 = Sk4h(15, 17, 257, 65535); 296cb93a386Sopenharmony_ci auto f4 = SkNx_cast<float>(h4); 297cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[0] == 15.0f); 298cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[1] == 17.0f); 299cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[2] == 257.0f); 300cb93a386Sopenharmony_ci REPORTER_ASSERT(r, f4[3] == 65535.0f); 301cb93a386Sopenharmony_ci } 302cb93a386Sopenharmony_ci { 303cb93a386Sopenharmony_ci // float -> u16 304cb93a386Sopenharmony_ci auto f4 = Sk4f(15, 17, 257, 65535); 305cb93a386Sopenharmony_ci auto h4 = SkNx_cast<uint16_t>(f4); 306cb93a386Sopenharmony_ci REPORTER_ASSERT(r, h4[0] == 15); 307cb93a386Sopenharmony_ci REPORTER_ASSERT(r, h4[1] == 17); 308cb93a386Sopenharmony_ci REPORTER_ASSERT(r, h4[2] == 257); 309cb93a386Sopenharmony_ci REPORTER_ASSERT(r, h4[3] == 65535); 310cb93a386Sopenharmony_ci } 311cb93a386Sopenharmony_ci 312cb93a386Sopenharmony_ci // starting with any u16 value, we should be able to have a perfect round-trip in/out of floats 313cb93a386Sopenharmony_ci // 314cb93a386Sopenharmony_ci SkRandom rand; 315cb93a386Sopenharmony_ci for (int i = 0; i < 10000; ++i) { 316cb93a386Sopenharmony_ci const uint16_t s16[4] { 317cb93a386Sopenharmony_ci (uint16_t)(rand.nextU() >> 16), (uint16_t)(rand.nextU() >> 16), 318cb93a386Sopenharmony_ci (uint16_t)(rand.nextU() >> 16), (uint16_t)(rand.nextU() >> 16), 319cb93a386Sopenharmony_ci }; 320cb93a386Sopenharmony_ci auto u4_0 = Sk4h::Load(s16); 321cb93a386Sopenharmony_ci auto f4 = SkNx_cast<float>(u4_0); 322cb93a386Sopenharmony_ci auto u4_1 = SkNx_cast<uint16_t>(f4); 323cb93a386Sopenharmony_ci uint16_t d16[4]; 324cb93a386Sopenharmony_ci u4_1.store(d16); 325cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !memcmp(s16, d16, sizeof(s16))); 326cb93a386Sopenharmony_ci } 327cb93a386Sopenharmony_ci} 328cb93a386Sopenharmony_ci 329cb93a386Sopenharmony_ci// The SSE2 implementation of SkNx_cast<uint16_t>(Sk4i) is non-trivial, so worth a test. 330cb93a386Sopenharmony_ciDEF_TEST(SkNx_int_u16, r) { 331cb93a386Sopenharmony_ci // These are pretty hard to get wrong. 332cb93a386Sopenharmony_ci for (int i = 0; i <= 0x7fff; i++) { 333cb93a386Sopenharmony_ci uint16_t expected = (uint16_t)i; 334cb93a386Sopenharmony_ci uint16_t actual = SkNx_cast<uint16_t>(Sk4i(i))[0]; 335cb93a386Sopenharmony_ci 336cb93a386Sopenharmony_ci REPORTER_ASSERT(r, expected == actual); 337cb93a386Sopenharmony_ci } 338cb93a386Sopenharmony_ci 339cb93a386Sopenharmony_ci // A naive implementation with _mm_packs_epi32 would succeed up to 0x7fff but fail here: 340cb93a386Sopenharmony_ci for (int i = 0x8000; (1) && i <= 0xffff; i++) { 341cb93a386Sopenharmony_ci uint16_t expected = (uint16_t)i; 342cb93a386Sopenharmony_ci uint16_t actual = SkNx_cast<uint16_t>(Sk4i(i))[0]; 343cb93a386Sopenharmony_ci 344cb93a386Sopenharmony_ci REPORTER_ASSERT(r, expected == actual); 345cb93a386Sopenharmony_ci } 346cb93a386Sopenharmony_ci} 347cb93a386Sopenharmony_ci 348cb93a386Sopenharmony_ciDEF_TEST(SkNx_4fLoad4Store4, r) { 349cb93a386Sopenharmony_ci float src[] = { 350cb93a386Sopenharmony_ci 0.0f, 1.0f, 2.0f, 3.0f, 351cb93a386Sopenharmony_ci 4.0f, 5.0f, 6.0f, 7.0f, 352cb93a386Sopenharmony_ci 8.0f, 9.0f, 10.0f, 11.0f, 353cb93a386Sopenharmony_ci 12.0f, 13.0f, 14.0f, 15.0f 354cb93a386Sopenharmony_ci }; 355cb93a386Sopenharmony_ci 356cb93a386Sopenharmony_ci Sk4f a, b, c, d; 357cb93a386Sopenharmony_ci Sk4f::Load4(src, &a, &b, &c, &d); 358cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 0.0f == a[0]); 359cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 4.0f == a[1]); 360cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 8.0f == a[2]); 361cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 12.0f == a[3]); 362cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 1.0f == b[0]); 363cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 5.0f == b[1]); 364cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 9.0f == b[2]); 365cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 13.0f == b[3]); 366cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 2.0f == c[0]); 367cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 6.0f == c[1]); 368cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 10.0f == c[2]); 369cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 14.0f == c[3]); 370cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 3.0f == d[0]); 371cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 7.0f == d[1]); 372cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 11.0f == d[2]); 373cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 15.0f == d[3]); 374cb93a386Sopenharmony_ci 375cb93a386Sopenharmony_ci float dst[16]; 376cb93a386Sopenharmony_ci Sk4f::Store4(dst, a, b, c, d); 377cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 0 == memcmp(dst, src, 16 * sizeof(float))); 378cb93a386Sopenharmony_ci} 379cb93a386Sopenharmony_ci 380cb93a386Sopenharmony_ciDEF_TEST(SkNx_neg, r) { 381cb93a386Sopenharmony_ci auto fs = -Sk4f(0.0f, -0.0f, 2.0f, -4.0f); 382cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[0] == 0.0f); 383cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[1] == 0.0f); 384cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[2] == -2.0f); 385cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[3] == 4.0f); 386cb93a386Sopenharmony_ci auto fshi = -Sk2f(0.0f, -0.0f); 387cb93a386Sopenharmony_ci auto fslo = -Sk2f(2.0f, -4.0f); 388cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[0] == 0.0f); 389cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[1] == 0.0f); 390cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[0] == -2.0f); 391cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[1] == 4.0f); 392cb93a386Sopenharmony_ci} 393cb93a386Sopenharmony_ci 394cb93a386Sopenharmony_ciDEF_TEST(SkNx_thenElse, r) { 395cb93a386Sopenharmony_ci auto fs = (Sk4f(0.0f, -0.0f, 2.0f, -4.0f) < 0).thenElse(-1, 1); 396cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[0] == 1); 397cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[1] == 1); 398cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[2] == 1); 399cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fs[3] == -1); 400cb93a386Sopenharmony_ci auto fshi = (Sk2f(0.0f, -0.0f) < 0).thenElse(-1, 1); 401cb93a386Sopenharmony_ci auto fslo = (Sk2f(2.0f, -4.0f) < 0).thenElse(-1, 1); 402cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[0] == 1); 403cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fshi[1] == 1); 404cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[0] == 1); 405cb93a386Sopenharmony_ci REPORTER_ASSERT(r, fslo[1] == -1); 406cb93a386Sopenharmony_ci} 407cb93a386Sopenharmony_ci 408cb93a386Sopenharmony_ciDEF_TEST(Sk4f_Load2, r) { 409cb93a386Sopenharmony_ci float xy[8] = { 0,1,2,3,4,5,6,7 }; 410cb93a386Sopenharmony_ci 411cb93a386Sopenharmony_ci Sk4f x,y; 412cb93a386Sopenharmony_ci Sk4f::Load2(xy, &x,&y); 413cb93a386Sopenharmony_ci 414cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[0] == 0); 415cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[1] == 2); 416cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[2] == 4); 417cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[3] == 6); 418cb93a386Sopenharmony_ci 419cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[0] == 1); 420cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[1] == 3); 421cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[2] == 5); 422cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[3] == 7); 423cb93a386Sopenharmony_ci} 424cb93a386Sopenharmony_ci 425cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Load2, r) { 426cb93a386Sopenharmony_ci float xy[4] = { 0,1,2,3 }; 427cb93a386Sopenharmony_ci 428cb93a386Sopenharmony_ci Sk2f x,y; 429cb93a386Sopenharmony_ci Sk2f::Load2(xy, &x,&y); 430cb93a386Sopenharmony_ci 431cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[0] == 0); 432cb93a386Sopenharmony_ci REPORTER_ASSERT(r, x[1] == 2); 433cb93a386Sopenharmony_ci 434cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[0] == 1); 435cb93a386Sopenharmony_ci REPORTER_ASSERT(r, y[1] == 3); 436cb93a386Sopenharmony_ci} 437cb93a386Sopenharmony_ci 438cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store2, r) { 439cb93a386Sopenharmony_ci Sk2f p0{0, 2}; 440cb93a386Sopenharmony_ci Sk2f p1{1, 3}; 441cb93a386Sopenharmony_ci float dst[4]; 442cb93a386Sopenharmony_ci Sk2f::Store2(dst, p0, p1); 443cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[0] == 0); 444cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[1] == 1); 445cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[2] == 2); 446cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[3] == 3); 447cb93a386Sopenharmony_ci} 448cb93a386Sopenharmony_ci 449cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store3, r) { 450cb93a386Sopenharmony_ci Sk2f p0{0, 3}; 451cb93a386Sopenharmony_ci Sk2f p1{1, 4}; 452cb93a386Sopenharmony_ci Sk2f p2{2, 5}; 453cb93a386Sopenharmony_ci float dst[6]; 454cb93a386Sopenharmony_ci Sk2f::Store3(dst, p0, p1, p2); 455cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[0] == 0); 456cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[1] == 1); 457cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[2] == 2); 458cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[3] == 3); 459cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[4] == 4); 460cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[5] == 5); 461cb93a386Sopenharmony_ci} 462cb93a386Sopenharmony_ci 463cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store4, r) { 464cb93a386Sopenharmony_ci Sk2f p0{0, 4}; 465cb93a386Sopenharmony_ci Sk2f p1{1, 5}; 466cb93a386Sopenharmony_ci Sk2f p2{2, 6}; 467cb93a386Sopenharmony_ci Sk2f p3{3, 7}; 468cb93a386Sopenharmony_ci 469cb93a386Sopenharmony_ci float dst[8] = {-1, -1, -1, -1, -1, -1, -1, -1}; 470cb93a386Sopenharmony_ci Sk2f::Store4(dst, p0, p1, p2, p3); 471cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[0] == 0); 472cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[1] == 1); 473cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[2] == 2); 474cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[3] == 3); 475cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[4] == 4); 476cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[5] == 5); 477cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[6] == 6); 478cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst[7] == 7); 479cb93a386Sopenharmony_ci 480cb93a386Sopenharmony_ci // Ensure transposing to Sk4f works. 481cb93a386Sopenharmony_ci Sk4f dst4f[2] = {{-1, -1, -1, -1}, {-1, -1, -1, -1}}; 482cb93a386Sopenharmony_ci Sk2f::Store4(dst4f, p0, p1, p2, p3); 483cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[0][0] == 0); 484cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[0][1] == 1); 485cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[0][2] == 2); 486cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[0][3] == 3); 487cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[1][0] == 4); 488cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[1][1] == 5); 489cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[1][2] == 6); 490cb93a386Sopenharmony_ci REPORTER_ASSERT(r, dst4f[1][3] == 7); 491cb93a386Sopenharmony_ci 492cb93a386Sopenharmony_ci} 493cb93a386Sopenharmony_ci 494cb93a386Sopenharmony_ciDEF_TEST(Sk4f_minmax, r) { 495cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 3 == Sk4f(0,1,2,3).max()); 496cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 2 == Sk4f(1,-5,2,-1).max()); 497cb93a386Sopenharmony_ci REPORTER_ASSERT(r, -1 == Sk4f(-2,-1,-6,-3).max()); 498cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 3 == Sk4f(3,2,1,0).max()); 499cb93a386Sopenharmony_ci 500cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 0 == Sk4f(0,1,2,3).min()); 501cb93a386Sopenharmony_ci REPORTER_ASSERT(r, -5 == Sk4f(1,-5,2,-1).min()); 502cb93a386Sopenharmony_ci REPORTER_ASSERT(r, -6 == Sk4f(-2,-1,-6,-3).min()); 503cb93a386Sopenharmony_ci REPORTER_ASSERT(r, 0 == Sk4f(3,2,1,0).min()); 504cb93a386Sopenharmony_ci} 505cb93a386Sopenharmony_ci 506cb93a386Sopenharmony_ciDEF_TEST(SkNf_anyTrue_allTrue, r) { 507cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk2f{1,2} < Sk2f{3,4}).anyTrue()); 508cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk2f{1,2} < Sk2f{3,4}).allTrue()); 509cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk2f{3,2} < Sk2f{1,4}).anyTrue()); 510cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(Sk2f{3,2} < Sk2f{1,4}).allTrue()); 511cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(Sk2f{3,4} < Sk2f{1,2}).anyTrue()); 512cb93a386Sopenharmony_ci 513cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk4f{1,2,3,4} < Sk4f{3,4,5,6}).anyTrue()); 514cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk4f{1,2,3,4} < Sk4f{3,4,5,6}).allTrue()); 515cb93a386Sopenharmony_ci REPORTER_ASSERT(r, (Sk4f{1,2,3,4} < Sk4f{1,4,1,1}).anyTrue()); 516cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(Sk4f{1,2,3,4} < Sk4f{1,4,1,1}).allTrue()); 517cb93a386Sopenharmony_ci REPORTER_ASSERT(r, !(Sk4f{3,4,5,6} < Sk4f{1,2,3,4}).anyTrue()); 518cb93a386Sopenharmony_ci} 519