1cb93a386Sopenharmony_ci/*
2cb93a386Sopenharmony_ci * Copyright 2015 Google Inc.
3cb93a386Sopenharmony_ci *
4cb93a386Sopenharmony_ci * Use of this source code is governed by a BSD-style license that can be
5cb93a386Sopenharmony_ci * found in the LICENSE file.
6cb93a386Sopenharmony_ci */
7cb93a386Sopenharmony_ci
8cb93a386Sopenharmony_ci#include "include/private/SkNx.h"
9cb93a386Sopenharmony_ci#include "include/utils/SkRandom.h"
10cb93a386Sopenharmony_ci#include "src/core/Sk4px.h"
11cb93a386Sopenharmony_ci#include "tests/Test.h"
12cb93a386Sopenharmony_ci
13cb93a386Sopenharmony_citemplate <int N>
14cb93a386Sopenharmony_cistatic void test_Nf(skiatest::Reporter* r) {
15cb93a386Sopenharmony_ci
16cb93a386Sopenharmony_ci    auto assert_nearly_eq = [&](float eps, const SkNx<N, float>& v,
17cb93a386Sopenharmony_ci                                float a, float b, float c, float d) {
18cb93a386Sopenharmony_ci        auto close = [=](float a, float b) { return fabsf(a-b) <= eps; };
19cb93a386Sopenharmony_ci        float vals[4];
20cb93a386Sopenharmony_ci        v.store(vals);
21cb93a386Sopenharmony_ci        bool ok = close(vals[0], a) && close(vals[1], b)
22cb93a386Sopenharmony_ci               && close(   v[0], a) && close(   v[1], b);
23cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, ok);
24cb93a386Sopenharmony_ci        if (N == 4) {
25cb93a386Sopenharmony_ci            ok = close(vals[2], c) && close(vals[3], d)
26cb93a386Sopenharmony_ci              && close(   v[2], c) && close(   v[3], d);
27cb93a386Sopenharmony_ci            REPORTER_ASSERT(r, ok);
28cb93a386Sopenharmony_ci        }
29cb93a386Sopenharmony_ci    };
30cb93a386Sopenharmony_ci    auto assert_eq = [&](const SkNx<N, float>& v, float a, float b, float c, float d) {
31cb93a386Sopenharmony_ci        return assert_nearly_eq(0, v, a,b,c,d);
32cb93a386Sopenharmony_ci    };
33cb93a386Sopenharmony_ci
34cb93a386Sopenharmony_ci    float vals[] = {3, 4, 5, 6};
35cb93a386Sopenharmony_ci    SkNx<N,float> a = SkNx<N,float>::Load(vals),
36cb93a386Sopenharmony_ci                  b(a),
37cb93a386Sopenharmony_ci                  c = a;
38cb93a386Sopenharmony_ci    SkNx<N,float> d;
39cb93a386Sopenharmony_ci    d = a;
40cb93a386Sopenharmony_ci
41cb93a386Sopenharmony_ci    assert_eq(a, 3, 4, 5, 6);
42cb93a386Sopenharmony_ci    assert_eq(b, 3, 4, 5, 6);
43cb93a386Sopenharmony_ci    assert_eq(c, 3, 4, 5, 6);
44cb93a386Sopenharmony_ci    assert_eq(d, 3, 4, 5, 6);
45cb93a386Sopenharmony_ci
46cb93a386Sopenharmony_ci    assert_eq(a+b, 6, 8, 10, 12);
47cb93a386Sopenharmony_ci    assert_eq(a*b, 9, 16, 25, 36);
48cb93a386Sopenharmony_ci    assert_eq(a*b-b, 6, 12, 20, 30);
49cb93a386Sopenharmony_ci    assert_eq((a*b).sqrt(), 3, 4, 5, 6);
50cb93a386Sopenharmony_ci    assert_eq(a/b, 1, 1, 1, 1);
51cb93a386Sopenharmony_ci    assert_eq(SkNx<N,float>(0)-a, -3, -4, -5, -6);
52cb93a386Sopenharmony_ci
53cb93a386Sopenharmony_ci    SkNx<N,float> fours(4);
54cb93a386Sopenharmony_ci
55cb93a386Sopenharmony_ci    assert_eq(fours.sqrt(), 2,2,2,2);
56cb93a386Sopenharmony_ci
57cb93a386Sopenharmony_ci    assert_eq(SkNx<N,float>::Min(a, fours), 3, 4, 4, 4);
58cb93a386Sopenharmony_ci    assert_eq(SkNx<N,float>::Max(a, fours), 4, 4, 5, 6);
59cb93a386Sopenharmony_ci
60cb93a386Sopenharmony_ci    // Test some comparisons.  This is not exhaustive.
61cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, (a == b).allTrue());
62cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, (a+b == a*b-b).anyTrue());
63cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(a+b == a*b-b).allTrue());
64cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(a+b == a*b).anyTrue());
65cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(a != b).anyTrue());
66cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, (a < fours).anyTrue());
67cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, (a <= fours).anyTrue());
68cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(a > fours).allTrue());
69cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(a >= fours).allTrue());
70cb93a386Sopenharmony_ci}
71cb93a386Sopenharmony_ci
72cb93a386Sopenharmony_ciDEF_TEST(SkNf, r) {
73cb93a386Sopenharmony_ci    test_Nf<2>(r);
74cb93a386Sopenharmony_ci    test_Nf<4>(r);
75cb93a386Sopenharmony_ci}
76cb93a386Sopenharmony_ci
77cb93a386Sopenharmony_citemplate <int N, typename T>
78cb93a386Sopenharmony_civoid test_Ni(skiatest::Reporter* r) {
79cb93a386Sopenharmony_ci    auto assert_eq = [&](const SkNx<N,T>& v, T a, T b, T c, T d, T e, T f, T g, T h) {
80cb93a386Sopenharmony_ci        T vals[8];
81cb93a386Sopenharmony_ci        v.store(vals);
82cb93a386Sopenharmony_ci
83cb93a386Sopenharmony_ci        switch (N) {
84cb93a386Sopenharmony_ci            case 8:
85cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, vals[4] == e && vals[5] == f && vals[6] == g && vals[7] == h);
86cb93a386Sopenharmony_ci                [[fallthrough]];
87cb93a386Sopenharmony_ci            case 4:
88cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, vals[2] == c && vals[3] == d);
89cb93a386Sopenharmony_ci                [[fallthrough]];
90cb93a386Sopenharmony_ci            case 2:
91cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, vals[0] == a && vals[1] == b);
92cb93a386Sopenharmony_ci        }
93cb93a386Sopenharmony_ci        switch (N) {
94cb93a386Sopenharmony_ci            case 8:
95cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, v[4] == e && v[5] == f && v[6] == g && v[7] == h);
96cb93a386Sopenharmony_ci                [[fallthrough]];
97cb93a386Sopenharmony_ci            case 4:
98cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, v[2] == c && v[3] == d);
99cb93a386Sopenharmony_ci                [[fallthrough]];
100cb93a386Sopenharmony_ci            case 2:
101cb93a386Sopenharmony_ci                REPORTER_ASSERT(r, v[0] == a && v[1] == b);
102cb93a386Sopenharmony_ci        }
103cb93a386Sopenharmony_ci    };
104cb93a386Sopenharmony_ci
105cb93a386Sopenharmony_ci    T vals[] = { 1,2,3,4,5,6,7,8 };
106cb93a386Sopenharmony_ci    SkNx<N,T> a = SkNx<N,T>::Load(vals),
107cb93a386Sopenharmony_ci              b(a),
108cb93a386Sopenharmony_ci              c = a;
109cb93a386Sopenharmony_ci    SkNx<N,T> d;
110cb93a386Sopenharmony_ci    d = a;
111cb93a386Sopenharmony_ci
112cb93a386Sopenharmony_ci    assert_eq(a, 1,2,3,4,5,6,7,8);
113cb93a386Sopenharmony_ci    assert_eq(b, 1,2,3,4,5,6,7,8);
114cb93a386Sopenharmony_ci    assert_eq(c, 1,2,3,4,5,6,7,8);
115cb93a386Sopenharmony_ci    assert_eq(d, 1,2,3,4,5,6,7,8);
116cb93a386Sopenharmony_ci
117cb93a386Sopenharmony_ci    assert_eq(a+a, 2,4,6,8,10,12,14,16);
118cb93a386Sopenharmony_ci    assert_eq(a*a, 1,4,9,16,25,36,49,64);
119cb93a386Sopenharmony_ci    assert_eq(a*a-a, 0,2,6,12,20,30,42,56);
120cb93a386Sopenharmony_ci
121cb93a386Sopenharmony_ci    assert_eq(a >> 2, 0,0,0,1,1,1,1,2);
122cb93a386Sopenharmony_ci    assert_eq(a << 1, 2,4,6,8,10,12,14,16);
123cb93a386Sopenharmony_ci
124cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, a[1] == 2);
125cb93a386Sopenharmony_ci}
126cb93a386Sopenharmony_ci
127cb93a386Sopenharmony_ciDEF_TEST(SkNx, r) {
128cb93a386Sopenharmony_ci    test_Ni<2, uint16_t>(r);
129cb93a386Sopenharmony_ci    test_Ni<4, uint16_t>(r);
130cb93a386Sopenharmony_ci    test_Ni<8, uint16_t>(r);
131cb93a386Sopenharmony_ci
132cb93a386Sopenharmony_ci    test_Ni<2, int>(r);
133cb93a386Sopenharmony_ci    test_Ni<4, int>(r);
134cb93a386Sopenharmony_ci    test_Ni<8, int>(r);
135cb93a386Sopenharmony_ci}
136cb93a386Sopenharmony_ci
137cb93a386Sopenharmony_ciDEF_TEST(SkNi_min_lt, r) {
138cb93a386Sopenharmony_ci    // Exhaustively check the 8x8 bit space.
139cb93a386Sopenharmony_ci    for (int a = 0; a < (1<<8); a++) {
140cb93a386Sopenharmony_ci    for (int b = 0; b < (1<<8); b++) {
141cb93a386Sopenharmony_ci        Sk16b aw(a), bw(b);
142cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, Sk16b::Min(aw, bw)[0] == std::min(a, b));
143cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, !(aw < bw)[0] == !(a < b));
144cb93a386Sopenharmony_ci    }}
145cb93a386Sopenharmony_ci
146cb93a386Sopenharmony_ci    // Exhausting the 16x16 bit space is kind of slow, so only do that in release builds.
147cb93a386Sopenharmony_ci#ifdef SK_DEBUG
148cb93a386Sopenharmony_ci    SkRandom rand;
149cb93a386Sopenharmony_ci    for (int i = 0; i < (1<<16); i++) {
150cb93a386Sopenharmony_ci        uint16_t a = rand.nextU() >> 16,
151cb93a386Sopenharmony_ci                 b = rand.nextU() >> 16;
152cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, Sk16h::Min(Sk16h(a), Sk16h(b))[0] == std::min(a, b));
153cb93a386Sopenharmony_ci    }
154cb93a386Sopenharmony_ci#else
155cb93a386Sopenharmony_ci    for (int a = 0; a < (1<<16); a++) {
156cb93a386Sopenharmony_ci    for (int b = 0; b < (1<<16); b++) {
157cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, Sk16h::Min(Sk16h(a), Sk16h(b))[0] == std::min(a, b));
158cb93a386Sopenharmony_ci    }}
159cb93a386Sopenharmony_ci#endif
160cb93a386Sopenharmony_ci}
161cb93a386Sopenharmony_ci
162cb93a386Sopenharmony_ciDEF_TEST(SkNi_saturatedAdd, r) {
163cb93a386Sopenharmony_ci    for (int a = 0; a < (1<<8); a++) {
164cb93a386Sopenharmony_ci    for (int b = 0; b < (1<<8); b++) {
165cb93a386Sopenharmony_ci        int exact = a+b;
166cb93a386Sopenharmony_ci        if (exact > 255) { exact = 255; }
167cb93a386Sopenharmony_ci        if (exact <   0) { exact =   0; }
168cb93a386Sopenharmony_ci
169cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, Sk16b(a).saturatedAdd(Sk16b(b))[0] == exact);
170cb93a386Sopenharmony_ci    }
171cb93a386Sopenharmony_ci    }
172cb93a386Sopenharmony_ci}
173cb93a386Sopenharmony_ci
174cb93a386Sopenharmony_ciDEF_TEST(SkNi_mulHi, r) {
175cb93a386Sopenharmony_ci    // First 8 primes.
176cb93a386Sopenharmony_ci    Sk4u a{ 0x00020000, 0x00030000, 0x00050000, 0x00070000 };
177cb93a386Sopenharmony_ci    Sk4u b{ 0x000b0000, 0x000d0000, 0x00110000, 0x00130000 };
178cb93a386Sopenharmony_ci
179cb93a386Sopenharmony_ci    Sk4u q{22, 39, 85, 133};
180cb93a386Sopenharmony_ci
181cb93a386Sopenharmony_ci    Sk4u c = a.mulHi(b);
182cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, c[0] == q[0]);
183cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, c[1] == q[1]);
184cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, c[2] == q[2]);
185cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, c[3] == q[3]);
186cb93a386Sopenharmony_ci}
187cb93a386Sopenharmony_ci
188cb93a386Sopenharmony_ciDEF_TEST(Sk4px_muldiv255round, r) {
189cb93a386Sopenharmony_ci    for (int a = 0; a < (1<<8); a++) {
190cb93a386Sopenharmony_ci    for (int b = 0; b < (1<<8); b++) {
191cb93a386Sopenharmony_ci        int exact = (a*b+127)/255;
192cb93a386Sopenharmony_ci
193cb93a386Sopenharmony_ci        // Duplicate a and b 16x each.
194cb93a386Sopenharmony_ci        Sk4px av = Sk16b(a),
195cb93a386Sopenharmony_ci              bv = Sk16b(b);
196cb93a386Sopenharmony_ci
197cb93a386Sopenharmony_ci        // This way should always be exactly correct.
198cb93a386Sopenharmony_ci        int correct = (av * bv).div255()[0];
199cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, correct == exact);
200cb93a386Sopenharmony_ci
201cb93a386Sopenharmony_ci        // We're a bit more flexible on this method: correct for 0 or 255, otherwise off by <=1.
202cb93a386Sopenharmony_ci        int fast = av.approxMulDiv255(bv)[0];
203cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, fast-exact >= -1 && fast-exact <= 1);
204cb93a386Sopenharmony_ci        if (a == 0 || a == 255 || b == 0 || b == 255) {
205cb93a386Sopenharmony_ci            REPORTER_ASSERT(r, fast == exact);
206cb93a386Sopenharmony_ci        }
207cb93a386Sopenharmony_ci    }
208cb93a386Sopenharmony_ci    }
209cb93a386Sopenharmony_ci}
210cb93a386Sopenharmony_ci
211cb93a386Sopenharmony_ciDEF_TEST(SkNx_abs, r) {
212cb93a386Sopenharmony_ci    auto fs = Sk4f(0.0f, -0.0f, 2.0f, -4.0f).abs();
213cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[0] == 0.0f);
214cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[1] == 0.0f);
215cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[2] == 2.0f);
216cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[3] == 4.0f);
217cb93a386Sopenharmony_ci    auto fshi = Sk2f(0.0f, -0.0f).abs();
218cb93a386Sopenharmony_ci    auto fslo = Sk2f(2.0f, -4.0f).abs();
219cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[0] == 0.0f);
220cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[1] == 0.0f);
221cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[0] == 2.0f);
222cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[1] == 4.0f);
223cb93a386Sopenharmony_ci}
224cb93a386Sopenharmony_ci
225cb93a386Sopenharmony_ciDEF_TEST(Sk4i_abs, r) {
226cb93a386Sopenharmony_ci    auto is = Sk4i(0, -1, 2, -2147483647).abs();
227cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, is[0] == 0);
228cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, is[1] == 1);
229cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, is[2] == 2);
230cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, is[3] == 2147483647);
231cb93a386Sopenharmony_ci}
232cb93a386Sopenharmony_ci
233cb93a386Sopenharmony_ciDEF_TEST(Sk4i_minmax, r) {
234cb93a386Sopenharmony_ci    auto a = Sk4i(0, 2, 4, 6);
235cb93a386Sopenharmony_ci    auto b = Sk4i(1, 1, 3, 7);
236cb93a386Sopenharmony_ci    auto min = Sk4i::Min(a, b);
237cb93a386Sopenharmony_ci    auto max = Sk4i::Max(a, b);
238cb93a386Sopenharmony_ci    for(int i = 0; i < 4; ++i) {
239cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, min[i] == std::min(a[i], b[i]));
240cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, max[i] == std::max(a[i], b[i]));
241cb93a386Sopenharmony_ci    }
242cb93a386Sopenharmony_ci}
243cb93a386Sopenharmony_ci
244cb93a386Sopenharmony_ciDEF_TEST(SkNx_floor, r) {
245cb93a386Sopenharmony_ci    auto fs = Sk4f(0.4f, -0.4f, 0.6f, -0.6f).floor();
246cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[0] ==  0.0f);
247cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[1] == -1.0f);
248cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[2] ==  0.0f);
249cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[3] == -1.0f);
250cb93a386Sopenharmony_ci
251cb93a386Sopenharmony_ci    auto fs2 = Sk2f(0.4f, -0.4f).floor();
252cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs2[0] ==  0.0f);
253cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs2[1] == -1.0f);
254cb93a386Sopenharmony_ci
255cb93a386Sopenharmony_ci    auto fs3 = Sk2f(0.6f, -0.6f).floor();
256cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs3[0] ==  0.0f);
257cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs3[1] == -1.0f);
258cb93a386Sopenharmony_ci}
259cb93a386Sopenharmony_ci
260cb93a386Sopenharmony_ciDEF_TEST(SkNx_shuffle, r) {
261cb93a386Sopenharmony_ci    Sk4f f4(0,10,20,30);
262cb93a386Sopenharmony_ci
263cb93a386Sopenharmony_ci    Sk2f f2 = SkNx_shuffle<2,1>(f4);
264cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f2[0] == 20);
265cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f2[1] == 10);
266cb93a386Sopenharmony_ci
267cb93a386Sopenharmony_ci    f4 = SkNx_shuffle<0,1,1,0>(f2);
268cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f4[0] == 20);
269cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f4[1] == 10);
270cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f4[2] == 10);
271cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f4[3] == 20);
272cb93a386Sopenharmony_ci}
273cb93a386Sopenharmony_ci
274cb93a386Sopenharmony_ciDEF_TEST(SkNx_int_float, r) {
275cb93a386Sopenharmony_ci    Sk4f f(-2.3f, 1.0f, 0.45f, 0.6f);
276cb93a386Sopenharmony_ci
277cb93a386Sopenharmony_ci    Sk4i i = SkNx_cast<int>(f);
278cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, i[0] == -2);
279cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, i[1] ==  1);
280cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, i[2] ==  0);
281cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, i[3] ==  0);
282cb93a386Sopenharmony_ci
283cb93a386Sopenharmony_ci    f = SkNx_cast<float>(i);
284cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f[0] == -2.0f);
285cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f[1] ==  1.0f);
286cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f[2] ==  0.0f);
287cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, f[3] ==  0.0f);
288cb93a386Sopenharmony_ci}
289cb93a386Sopenharmony_ci
290cb93a386Sopenharmony_ci#include "include/utils/SkRandom.h"
291cb93a386Sopenharmony_ci
292cb93a386Sopenharmony_ciDEF_TEST(SkNx_u16_float, r) {
293cb93a386Sopenharmony_ci    {
294cb93a386Sopenharmony_ci        // u16 --> float
295cb93a386Sopenharmony_ci        auto h4 = Sk4h(15, 17, 257, 65535);
296cb93a386Sopenharmony_ci        auto f4 = SkNx_cast<float>(h4);
297cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, f4[0] == 15.0f);
298cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, f4[1] == 17.0f);
299cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, f4[2] == 257.0f);
300cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, f4[3] == 65535.0f);
301cb93a386Sopenharmony_ci    }
302cb93a386Sopenharmony_ci    {
303cb93a386Sopenharmony_ci        // float -> u16
304cb93a386Sopenharmony_ci        auto f4 = Sk4f(15, 17, 257, 65535);
305cb93a386Sopenharmony_ci        auto h4 = SkNx_cast<uint16_t>(f4);
306cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, h4[0] == 15);
307cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, h4[1] == 17);
308cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, h4[2] == 257);
309cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, h4[3] == 65535);
310cb93a386Sopenharmony_ci    }
311cb93a386Sopenharmony_ci
312cb93a386Sopenharmony_ci    // starting with any u16 value, we should be able to have a perfect round-trip in/out of floats
313cb93a386Sopenharmony_ci    //
314cb93a386Sopenharmony_ci    SkRandom rand;
315cb93a386Sopenharmony_ci    for (int i = 0; i < 10000; ++i) {
316cb93a386Sopenharmony_ci        const uint16_t s16[4] {
317cb93a386Sopenharmony_ci            (uint16_t)(rand.nextU() >> 16), (uint16_t)(rand.nextU() >> 16),
318cb93a386Sopenharmony_ci            (uint16_t)(rand.nextU() >> 16), (uint16_t)(rand.nextU() >> 16),
319cb93a386Sopenharmony_ci        };
320cb93a386Sopenharmony_ci        auto u4_0 = Sk4h::Load(s16);
321cb93a386Sopenharmony_ci        auto f4 = SkNx_cast<float>(u4_0);
322cb93a386Sopenharmony_ci        auto u4_1 = SkNx_cast<uint16_t>(f4);
323cb93a386Sopenharmony_ci        uint16_t d16[4];
324cb93a386Sopenharmony_ci        u4_1.store(d16);
325cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, !memcmp(s16, d16, sizeof(s16)));
326cb93a386Sopenharmony_ci    }
327cb93a386Sopenharmony_ci}
328cb93a386Sopenharmony_ci
329cb93a386Sopenharmony_ci// The SSE2 implementation of SkNx_cast<uint16_t>(Sk4i) is non-trivial, so worth a test.
330cb93a386Sopenharmony_ciDEF_TEST(SkNx_int_u16, r) {
331cb93a386Sopenharmony_ci    // These are pretty hard to get wrong.
332cb93a386Sopenharmony_ci    for (int i = 0; i <= 0x7fff; i++) {
333cb93a386Sopenharmony_ci        uint16_t expected = (uint16_t)i;
334cb93a386Sopenharmony_ci        uint16_t actual = SkNx_cast<uint16_t>(Sk4i(i))[0];
335cb93a386Sopenharmony_ci
336cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, expected == actual);
337cb93a386Sopenharmony_ci    }
338cb93a386Sopenharmony_ci
339cb93a386Sopenharmony_ci    // A naive implementation with _mm_packs_epi32 would succeed up to 0x7fff but fail here:
340cb93a386Sopenharmony_ci    for (int i = 0x8000; (1) && i <= 0xffff; i++) {
341cb93a386Sopenharmony_ci        uint16_t expected = (uint16_t)i;
342cb93a386Sopenharmony_ci        uint16_t actual = SkNx_cast<uint16_t>(Sk4i(i))[0];
343cb93a386Sopenharmony_ci
344cb93a386Sopenharmony_ci        REPORTER_ASSERT(r, expected == actual);
345cb93a386Sopenharmony_ci    }
346cb93a386Sopenharmony_ci}
347cb93a386Sopenharmony_ci
348cb93a386Sopenharmony_ciDEF_TEST(SkNx_4fLoad4Store4, r) {
349cb93a386Sopenharmony_ci    float src[] = {
350cb93a386Sopenharmony_ci         0.0f,  1.0f,  2.0f,  3.0f,
351cb93a386Sopenharmony_ci         4.0f,  5.0f,  6.0f,  7.0f,
352cb93a386Sopenharmony_ci         8.0f,  9.0f, 10.0f, 11.0f,
353cb93a386Sopenharmony_ci        12.0f, 13.0f, 14.0f, 15.0f
354cb93a386Sopenharmony_ci    };
355cb93a386Sopenharmony_ci
356cb93a386Sopenharmony_ci    Sk4f a, b, c, d;
357cb93a386Sopenharmony_ci    Sk4f::Load4(src, &a, &b, &c, &d);
358cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  0.0f == a[0]);
359cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  4.0f == a[1]);
360cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  8.0f == a[2]);
361cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 12.0f == a[3]);
362cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  1.0f == b[0]);
363cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  5.0f == b[1]);
364cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  9.0f == b[2]);
365cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 13.0f == b[3]);
366cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  2.0f == c[0]);
367cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  6.0f == c[1]);
368cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 10.0f == c[2]);
369cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 14.0f == c[3]);
370cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  3.0f == d[0]);
371cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  7.0f == d[1]);
372cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 11.0f == d[2]);
373cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 15.0f == d[3]);
374cb93a386Sopenharmony_ci
375cb93a386Sopenharmony_ci    float dst[16];
376cb93a386Sopenharmony_ci    Sk4f::Store4(dst, a, b, c, d);
377cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, 0 == memcmp(dst, src, 16 * sizeof(float)));
378cb93a386Sopenharmony_ci}
379cb93a386Sopenharmony_ci
380cb93a386Sopenharmony_ciDEF_TEST(SkNx_neg, r) {
381cb93a386Sopenharmony_ci    auto fs = -Sk4f(0.0f, -0.0f, 2.0f, -4.0f);
382cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[0] == 0.0f);
383cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[1] == 0.0f);
384cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[2] == -2.0f);
385cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[3] == 4.0f);
386cb93a386Sopenharmony_ci    auto fshi = -Sk2f(0.0f, -0.0f);
387cb93a386Sopenharmony_ci    auto fslo = -Sk2f(2.0f, -4.0f);
388cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[0] == 0.0f);
389cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[1] == 0.0f);
390cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[0] == -2.0f);
391cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[1] == 4.0f);
392cb93a386Sopenharmony_ci}
393cb93a386Sopenharmony_ci
394cb93a386Sopenharmony_ciDEF_TEST(SkNx_thenElse, r) {
395cb93a386Sopenharmony_ci    auto fs = (Sk4f(0.0f, -0.0f, 2.0f, -4.0f) < 0).thenElse(-1, 1);
396cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[0] == 1);
397cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[1] == 1);
398cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[2] == 1);
399cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fs[3] == -1);
400cb93a386Sopenharmony_ci    auto fshi = (Sk2f(0.0f, -0.0f) < 0).thenElse(-1, 1);
401cb93a386Sopenharmony_ci    auto fslo = (Sk2f(2.0f, -4.0f) < 0).thenElse(-1, 1);
402cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[0] == 1);
403cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fshi[1] == 1);
404cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[0] == 1);
405cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, fslo[1] == -1);
406cb93a386Sopenharmony_ci}
407cb93a386Sopenharmony_ci
408cb93a386Sopenharmony_ciDEF_TEST(Sk4f_Load2, r) {
409cb93a386Sopenharmony_ci    float xy[8] = { 0,1,2,3,4,5,6,7 };
410cb93a386Sopenharmony_ci
411cb93a386Sopenharmony_ci    Sk4f x,y;
412cb93a386Sopenharmony_ci    Sk4f::Load2(xy, &x,&y);
413cb93a386Sopenharmony_ci
414cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[0] == 0);
415cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[1] == 2);
416cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[2] == 4);
417cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[3] == 6);
418cb93a386Sopenharmony_ci
419cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[0] == 1);
420cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[1] == 3);
421cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[2] == 5);
422cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[3] == 7);
423cb93a386Sopenharmony_ci}
424cb93a386Sopenharmony_ci
425cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Load2, r) {
426cb93a386Sopenharmony_ci    float xy[4] = { 0,1,2,3 };
427cb93a386Sopenharmony_ci
428cb93a386Sopenharmony_ci    Sk2f x,y;
429cb93a386Sopenharmony_ci    Sk2f::Load2(xy, &x,&y);
430cb93a386Sopenharmony_ci
431cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[0] == 0);
432cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, x[1] == 2);
433cb93a386Sopenharmony_ci
434cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[0] == 1);
435cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, y[1] == 3);
436cb93a386Sopenharmony_ci}
437cb93a386Sopenharmony_ci
438cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store2, r) {
439cb93a386Sopenharmony_ci    Sk2f p0{0, 2};
440cb93a386Sopenharmony_ci    Sk2f p1{1, 3};
441cb93a386Sopenharmony_ci    float dst[4];
442cb93a386Sopenharmony_ci    Sk2f::Store2(dst, p0, p1);
443cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[0] == 0);
444cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[1] == 1);
445cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[2] == 2);
446cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[3] == 3);
447cb93a386Sopenharmony_ci}
448cb93a386Sopenharmony_ci
449cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store3, r) {
450cb93a386Sopenharmony_ci    Sk2f p0{0, 3};
451cb93a386Sopenharmony_ci    Sk2f p1{1, 4};
452cb93a386Sopenharmony_ci    Sk2f p2{2, 5};
453cb93a386Sopenharmony_ci    float dst[6];
454cb93a386Sopenharmony_ci    Sk2f::Store3(dst, p0, p1, p2);
455cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[0] == 0);
456cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[1] == 1);
457cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[2] == 2);
458cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[3] == 3);
459cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[4] == 4);
460cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[5] == 5);
461cb93a386Sopenharmony_ci}
462cb93a386Sopenharmony_ci
463cb93a386Sopenharmony_ciDEF_TEST(Sk2f_Store4, r) {
464cb93a386Sopenharmony_ci    Sk2f p0{0, 4};
465cb93a386Sopenharmony_ci    Sk2f p1{1, 5};
466cb93a386Sopenharmony_ci    Sk2f p2{2, 6};
467cb93a386Sopenharmony_ci    Sk2f p3{3, 7};
468cb93a386Sopenharmony_ci
469cb93a386Sopenharmony_ci    float dst[8] = {-1, -1, -1, -1, -1, -1, -1, -1};
470cb93a386Sopenharmony_ci    Sk2f::Store4(dst, p0, p1, p2, p3);
471cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[0] == 0);
472cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[1] == 1);
473cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[2] == 2);
474cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[3] == 3);
475cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[4] == 4);
476cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[5] == 5);
477cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[6] == 6);
478cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst[7] == 7);
479cb93a386Sopenharmony_ci
480cb93a386Sopenharmony_ci    // Ensure transposing to Sk4f works.
481cb93a386Sopenharmony_ci    Sk4f dst4f[2] = {{-1, -1, -1, -1}, {-1, -1, -1, -1}};
482cb93a386Sopenharmony_ci    Sk2f::Store4(dst4f, p0, p1, p2, p3);
483cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[0][0] == 0);
484cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[0][1] == 1);
485cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[0][2] == 2);
486cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[0][3] == 3);
487cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[1][0] == 4);
488cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[1][1] == 5);
489cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[1][2] == 6);
490cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, dst4f[1][3] == 7);
491cb93a386Sopenharmony_ci
492cb93a386Sopenharmony_ci}
493cb93a386Sopenharmony_ci
494cb93a386Sopenharmony_ciDEF_TEST(Sk4f_minmax, r) {
495cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  3 == Sk4f(0,1,2,3).max());
496cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  2 == Sk4f(1,-5,2,-1).max());
497cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, -1 == Sk4f(-2,-1,-6,-3).max());
498cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  3 == Sk4f(3,2,1,0).max());
499cb93a386Sopenharmony_ci
500cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  0 == Sk4f(0,1,2,3).min());
501cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, -5 == Sk4f(1,-5,2,-1).min());
502cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, -6 == Sk4f(-2,-1,-6,-3).min());
503cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  0 == Sk4f(3,2,1,0).min());
504cb93a386Sopenharmony_ci}
505cb93a386Sopenharmony_ci
506cb93a386Sopenharmony_ciDEF_TEST(SkNf_anyTrue_allTrue, r) {
507cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk2f{1,2} < Sk2f{3,4}).anyTrue());
508cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk2f{1,2} < Sk2f{3,4}).allTrue());
509cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk2f{3,2} < Sk2f{1,4}).anyTrue());
510cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(Sk2f{3,2} < Sk2f{1,4}).allTrue());
511cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(Sk2f{3,4} < Sk2f{1,2}).anyTrue());
512cb93a386Sopenharmony_ci
513cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk4f{1,2,3,4} < Sk4f{3,4,5,6}).anyTrue());
514cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk4f{1,2,3,4} < Sk4f{3,4,5,6}).allTrue());
515cb93a386Sopenharmony_ci    REPORTER_ASSERT(r,  (Sk4f{1,2,3,4} < Sk4f{1,4,1,1}).anyTrue());
516cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(Sk4f{1,2,3,4} < Sk4f{1,4,1,1}).allTrue());
517cb93a386Sopenharmony_ci    REPORTER_ASSERT(r, !(Sk4f{3,4,5,6} < Sk4f{1,2,3,4}).anyTrue());
518cb93a386Sopenharmony_ci}
519