#include "../test.h"
#include "../../aligned.h"
#include "../../kernels.h"

#include <cmath>
#include <cstddef>
#include <numeric>

namespace intgemm {

// Checks kernels::floor against std::floor for one full SIMD register of
// floats on the instruction set selected by CPUType_.
//
// The test is skipped (returns without checking anything) when kCPU compares
// less than CPUType_.
//
// NOTE(review): the template parameter list and every template argument in
// this file were missing from the text under review and have been
// reconstructed. The element type `float` follows from `sizeof(float)` and the
// comparison with `std::floor`; the `vector_t<CPUType_, float>` argument order
// and the `CPUType::...` enumerator spellings below must be confirmed against
// the project's type declarations.
template <CPUType CPUType_>
void kernel_floor_test() {
  if (kCPU < CPUType_)
    return;

  using vec_t = vector_t<CPUType_, float>;
  // Number of floats that fit in one register of type vec_t.
  constexpr static auto VECTOR_LENGTH = sizeof(vec_t) / sizeof(float);

  AlignedVector<float> input(VECTOR_LENGTH);
  AlignedVector<float> output(VECTOR_LENGTH);

  // Consecutive integers starting at -(VECTOR_LENGTH / 2), so the input covers
  // negative values, zero and positive values.
  std::iota(input.begin(), input.end(), -static_cast<int>(VECTOR_LENGTH / 2));

  // Process the whole buffer as a single register-wide value.
  *output.template as<vec_t>() = kernels::floor(*input.template as<vec_t>());

  // Every lane must agree with the scalar reference implementation.
  for (std::size_t i = 0; i < output.size(); ++i)
    CHECK(output[i] == std::floor(input[i]));
}

// Explicit instantiations carry the per-ISA target attribute macro so the
// body is compiled for the matching instruction set.
// NOTE(review): enumerator names are reconstructed — confirm against CPUType.
template INTGEMM_SSE2 void kernel_floor_test<CPUType::SSE2>();
KERNEL_TEST_CASE("floor SSE2") { return kernel_floor_test<CPUType::SSE2>(); }

template INTGEMM_AVX2 void kernel_floor_test<CPUType::AVX2>();
KERNEL_TEST_CASE("floor AVX2") { return kernel_floor_test<CPUType::AVX2>(); }

#ifdef INTGEMM_COMPILER_SUPPORTS_AVX512
template INTGEMM_AVX512BW void kernel_floor_test<CPUType::AVX512BW>();
KERNEL_TEST_CASE("floor AVX512BW") { return kernel_floor_test<CPUType::AVX512BW>(); }
#endif

}  // namespace intgemm