#include "../test.h"
#include "../../aligned.h"
#include "../../kernels.h"

#include <cstddef>
#include <numeric>

namespace intgemm {

/// Checks kernels::quantize on a single SIMD register for one CPU target.
///
/// The input register is filled with 0, 1, 2, ... (as floats), quantized with
/// a multiplier of 2 broadcast to every lane, and each resulting integer lane
/// is compared against int(i * 2.f).
///
/// The test returns without checking anything when `kCPU < CPUType_`.
/// NOTE(review): presumably kCPU is the CPU level selected for this run, so
/// the guard avoids executing unsupported instructions -- confirm.
///
/// NOTE(review): the template parameter list and all template arguments below
/// were reconstructed from how the names are used in this file (the angle
/// bracket contents were missing); confirm them against the declarations of
/// CPUType, vector_t, AlignedVector and set1_ps.
template <CPUType CPUType_>
void kernel_quantize_test() {
  if (kCPU < CPUType_)
    return;

  // Register types for the target; lane counts are derived from their sizes.
  using input_vec_t = vector_t<CPUType_, float>;
  using output_vec_t = vector_t<CPUType_, int>;

  // Exactly one register's worth of elements on each side.
  AlignedVector<float> input(sizeof(input_vec_t) / sizeof(float));
  AlignedVector<int> output(sizeof(output_vec_t) / sizeof(int));

  // input[i] = i
  std::iota(input.begin(), input.end(), 0);
  auto quant_mult = set1_ps<input_vec_t>(2.f);

  // View both buffers as single registers and run the kernel once.
  *output.template as<output_vec_t>() = kernels::quantize(*input.template as<input_vec_t>(), quant_mult);

  for (std::size_t i = 0; i < output.size(); ++i)
    CHECK(output[i] == int(i*2.f));
}

// Explicit instantiations carry the per-target attribute macro.
// NOTE(review): enumerator spellings are inferred from the INTGEMM_* macro
// names and the test-case titles -- confirm against the CPUType definition.
template INTGEMM_SSE2 void kernel_quantize_test<CPUType::SSE2>();
KERNEL_TEST_CASE("quantize SSE2") { return kernel_quantize_test<CPUType::SSE2>(); }

template INTGEMM_AVX2 void kernel_quantize_test<CPUType::AVX2>();
KERNEL_TEST_CASE("quantize AVX2") { return kernel_quantize_test<CPUType::AVX2>(); }

// The AVX512BW variant is compiled only when this macro is defined.
#ifdef INTGEMM_COMPILER_SUPPORTS_AVX512
template INTGEMM_AVX512BW void kernel_quantize_test<CPUType::AVX512BW>();
KERNEL_TEST_CASE("quantize AVX512BW") { return kernel_quantize_test<CPUType::AVX512BW>(); }
#endif

}