tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

simd_util_test.cc (2465B)


      1 // Copyright (c) the JPEG XL Project Authors. All rights reserved.
      2 //
      3 // Use of this source code is governed by a BSD-style
      4 // license that can be found in the LICENSE file.
      5 
      6 #include "lib/jxl/testing.h"
      7 
      8 #undef HWY_TARGET_INCLUDE
      9 #define HWY_TARGET_INCLUDE "lib/jxl/simd_util_test.cc"
     10 #include <hwy/foreach_target.h>
     11 
     12 #include "lib/jxl/simd_util-inl.h"
     13 
     14 // Test utils
     15 #include <hwy/highway.h>
     16 #include <hwy/tests/hwy_gtest.h>
     17 HWY_BEFORE_NAMESPACE();
     18 namespace jxl {
     19 namespace HWY_NAMESPACE {
     20 namespace {
     21 
     22 HWY_NOINLINE void TestInterleave2() {
     23  HWY_FULL(float) d;
     24  auto vec1 = Iota(d, 0 * 128.0);
     25  auto vec2 = Iota(d, 1 * 128.0);
     26  HWY_ALIGN float mem[MaxLanes(d) * 2];
     27  StoreInterleaved(d, vec1, vec2, mem);
     28  for (size_t i = 0; i < Lanes(d); i++) {
     29    for (size_t j = 0; j < 2; j++) {
     30      EXPECT_EQ(mem[2 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     31    }
     32  }
     33 }
     34 HWY_NOINLINE void TestInterleave4() {
     35  HWY_FULL(float) d;
     36  auto vec1 = Iota(d, 0 * 128.0);
     37  auto vec2 = Iota(d, 1 * 128.0);
     38  auto vec3 = Iota(d, 2 * 128.0);
     39  auto vec4 = Iota(d, 3 * 128.0);
     40  HWY_ALIGN float mem[MaxLanes(d) * 4];
     41  StoreInterleaved(d, vec1, vec2, vec3, vec4, mem);
     42  for (size_t i = 0; i < Lanes(d); i++) {
     43    for (size_t j = 0; j < 4; j++) {
     44      EXPECT_EQ(mem[4 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     45    }
     46  }
     47 }
     48 HWY_NOINLINE void TestInterleave8() {
     49  HWY_FULL(float) d;
     50  auto vec1 = Iota(d, 0 * 128.0);
     51  auto vec2 = Iota(d, 1 * 128.0);
     52  auto vec3 = Iota(d, 2 * 128.0);
     53  auto vec4 = Iota(d, 3 * 128.0);
     54  auto vec5 = Iota(d, 4 * 128.0);
     55  auto vec6 = Iota(d, 5 * 128.0);
     56  auto vec7 = Iota(d, 6 * 128.0);
     57  auto vec8 = Iota(d, 7 * 128.0);
     58  HWY_ALIGN float mem[MaxLanes(d) * 8];
     59  StoreInterleaved(d, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, mem);
     60  for (size_t i = 0; i < Lanes(d); i++) {
     61    for (size_t j = 0; j < 8; j++) {
     62      EXPECT_EQ(mem[8 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     63    }
     64  }
     65 }
     66 
     67 }  // namespace
     68 // NOLINTNEXTLINE(google-readability-namespace-comments)
     69 }  // namespace HWY_NAMESPACE
     70 }  // namespace jxl
     71 HWY_AFTER_NAMESPACE();
     72 
// Everything in this section sits behind HWY_ONCE. NOTE(review): per Highway's
// documentation, <hwy/foreach_target.h> re-includes this file (named by
// HWY_TARGET_INCLUDE) once per enabled target and HWY_ONCE is true for only
// one of those passes, so the suite below is defined a single time - confirm
// against the Highway version in use.
#if HWY_ONCE
namespace jxl {

// Parameterized gtest fixture for the StoreInterleaved tests; it adds nothing
// beyond what hwy::TestWithParamTarget provides.
class SimdUtilTargetTest : public hwy::TestWithParamTarget {};
HWY_TARGET_INSTANTIATE_TEST_SUITE_P(SimdUtilTargetTest);

// One test case per interleave width (2, 4 and 8 input vectors), each bound
// to the per-target function of the same name in jxl::HWY_NAMESPACE.
HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave2);
HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave4);
HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave8);

}  // namespace jxl
#endif  // HWY_ONCE