libjxl

FORK: libjxl patches used on blog
git clone https://git.neptards.moe/blog/libjxl.git
Log | Files | Refs | Submodules | README | LICENSE

simd_util_test.cc (2465B)


      1 // Copyright (c) the JPEG XL Project Authors. All rights reserved.
      2 //
      3 // Use of this source code is governed by a BSD-style
      4 // license that can be found in the LICENSE file.
      5 
      6 #include "lib/jxl/testing.h"
      7 
      8 #undef HWY_TARGET_INCLUDE
      9 #define HWY_TARGET_INCLUDE "lib/jxl/simd_util_test.cc"
     10 #include <hwy/foreach_target.h>
     11 
     12 #include "lib/jxl/simd_util-inl.h"
     13 
     14 // Test utils
     15 #include <hwy/highway.h>
     16 #include <hwy/tests/hwy_gtest.h>
     17 HWY_BEFORE_NAMESPACE();
     18 namespace jxl {
     19 namespace HWY_NAMESPACE {
     20 namespace {
     21 
     22 HWY_NOINLINE void TestInterleave2() {
     23   HWY_FULL(float) d;
     24   auto vec1 = Iota(d, 0 * 128.0);
     25   auto vec2 = Iota(d, 1 * 128.0);
     26   HWY_ALIGN float mem[MaxLanes(d) * 2];
     27   StoreInterleaved(d, vec1, vec2, mem);
     28   for (size_t i = 0; i < Lanes(d); i++) {
     29     for (size_t j = 0; j < 2; j++) {
     30       EXPECT_EQ(mem[2 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     31     }
     32   }
     33 }
     34 HWY_NOINLINE void TestInterleave4() {
     35   HWY_FULL(float) d;
     36   auto vec1 = Iota(d, 0 * 128.0);
     37   auto vec2 = Iota(d, 1 * 128.0);
     38   auto vec3 = Iota(d, 2 * 128.0);
     39   auto vec4 = Iota(d, 3 * 128.0);
     40   HWY_ALIGN float mem[MaxLanes(d) * 4];
     41   StoreInterleaved(d, vec1, vec2, vec3, vec4, mem);
     42   for (size_t i = 0; i < Lanes(d); i++) {
     43     for (size_t j = 0; j < 4; j++) {
     44       EXPECT_EQ(mem[4 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     45     }
     46   }
     47 }
     48 HWY_NOINLINE void TestInterleave8() {
     49   HWY_FULL(float) d;
     50   auto vec1 = Iota(d, 0 * 128.0);
     51   auto vec2 = Iota(d, 1 * 128.0);
     52   auto vec3 = Iota(d, 2 * 128.0);
     53   auto vec4 = Iota(d, 3 * 128.0);
     54   auto vec5 = Iota(d, 4 * 128.0);
     55   auto vec6 = Iota(d, 5 * 128.0);
     56   auto vec7 = Iota(d, 6 * 128.0);
     57   auto vec8 = Iota(d, 7 * 128.0);
     58   HWY_ALIGN float mem[MaxLanes(d) * 8];
     59   StoreInterleaved(d, vec1, vec2, vec3, vec4, vec5, vec6, vec7, vec8, mem);
     60   for (size_t i = 0; i < Lanes(d); i++) {
     61     for (size_t j = 0; j < 8; j++) {
     62       EXPECT_EQ(mem[8 * i + j], j * 128 + i) << "i: " << i << " j: " << j;
     63     }
     64   }
     65 }
     66 
     67 }  // namespace
     68 // NOLINTNEXTLINE(google-readability-namespace-comments)
     69 }  // namespace HWY_NAMESPACE
     70 }  // namespace jxl
     71 HWY_AFTER_NAMESPACE();
     72 
     73 #if HWY_ONCE
     74 namespace jxl {
     75 
     76 class SimdUtilTargetTest : public hwy::TestWithParamTarget {};
     77 HWY_TARGET_INSTANTIATE_TEST_SUITE_P(SimdUtilTargetTest);
     78 
     79 HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave2);
     80 HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave4);
     81 HWY_EXPORT_AND_TEST_P(SimdUtilTargetTest, TestInterleave8);
     82 
     83 }  // namespace jxl
     84 #endif  // HWY_ONCE