// Unit test for kernels::rescale, registered once per instruction set
// (SSE2, AVX2, and AVX512BW when INTGEMM_COMPILER_SUPPORTS_AVX512BW is defined).
//
// kernel_rescale_test():
//   * returns immediately when kCPU < CPUType_ (presumably because the target
//     instruction set is not available on the running CPU -- confirm against
//     the definition of kCPU);
//   * LENGTH = sizeof(vi) / sizeof(int), i.e. how many ints fit in one `vi`;
//   * fills `input` with consecutive integers starting at -LENGTH / 2
//     (std::iota), so negative and non-negative values are both covered;
//   * calls kernels::rescale once on the input buffer viewed through as(),
//     with the scale (2) broadcast via intgemm::set1_ps, and stores the result
//     through the output buffer's as() view;
//   * CHECKs every element: output[i] == std::round(input[i] * scale).
//
// Each KERNEL_TEST_CASE simply forwards to the explicit instantiation declared
// immediately before it.
//
// NOTE(review): in this copy the whole file sits on one physical line and all
// angle-bracketed text appears to be missing (a bare `#include`, `template`
// without a parameter list, `vector_t` / `AlignedVector` / `as()` /
// `set1_ps` / `kernel_rescale_test()` without template arguments). This looks
// like extraction damage rather than the intended source -- restore the line
// breaks and template arguments from version control before building.
// TODO confirm.
#include "../test.h" #include "../../aligned.h" #include "../../kernels.h" #include namespace intgemm { template void kernel_rescale_test() { if (kCPU < CPUType_) return; using vi = vector_t; using vf = vector_t; const int LENGTH = sizeof(vi) / sizeof(int); AlignedVector input(LENGTH); AlignedVector output(LENGTH); std::iota(input.begin(), input.end(), -LENGTH / 2); float scale = 2; *output.template as() = kernels::rescale(*input.template as(), intgemm::set1_ps(scale)); for (std::size_t i = 0; i < output.size(); ++i) CHECK(output[i] == std::round(input[i] * scale)); } template INTGEMM_SSE2 void kernel_rescale_test(); KERNEL_TEST_CASE("rescale SSE2") { return kernel_rescale_test(); } template INTGEMM_AVX2 void kernel_rescale_test(); KERNEL_TEST_CASE("rescale AVX2") { return kernel_rescale_test(); } #ifdef INTGEMM_COMPILER_SUPPORTS_AVX512BW template INTGEMM_AVX512BW void kernel_rescale_test(); KERNEL_TEST_CASE("rescale AVX512BW") { return kernel_rescale_test(); } #endif }