#include "test/test.h"
#include "aligned.h"
#include "kernels.h"

#include <cstddef>
#include <cstdint>
#include <numeric>

// NOTE(review): in the reviewed text every angle-bracket span was missing
// (the standard header name, the template parameter list and all template
// argument lists). They are restored here from how the names are used in this
// file: std::iota needs <numeric>, the test-case labels name the element types,
// and the INTGEMM_* macros name the instruction sets. Confirm the CPUType
// enumerator spellings and the vector_t parameter order against the project
// headers before merging.

namespace intgemm {

/**
 * Compares kernels::multiply against a plain scalar multiplication for one
 * full vector of Type_ elements.
 *
 * Template parameters:
 *   CPUType_  instruction set under test; the function returns without
 *             checking anything when kCPU < CPUType_.
 *   Type_     element type stored in the vector.
 *
 * The two inputs are ascending ramps produced by std::iota, starting at
 * -(VECTOR_LENGTH / 2) and -(VECTOR_LENGTH / 3) respectively. Every output
 * element is compared with the scalar product converted back to Type_.
 */
template <CPUType CPUType_, typename Type_>
void kernel_multiply_test() {
  // presumably kCPU is the best instruction set available on the machine
  // running the tests -- confirm in test/test.h.
  if (kCPU < CPUType_)
    return;

  using vec_t = vector_t<CPUType_, Type_>;
  // Number of Type_ elements that fit in one vec_t.
  constexpr static std::size_t VECTOR_LENGTH = sizeof(vec_t) / sizeof(Type_);

  AlignedVector<Type_> input1(VECTOR_LENGTH);
  AlignedVector<Type_> input2(VECTOR_LENGTH);
  AlignedVector<Type_> output(VECTOR_LENGTH);

  // The division happens in the unsigned size type and only the quotient is
  // negated, after conversion to int, so the start value is a small negative
  // int rather than a wrapped-around unsigned number.
  std::iota(input1.begin(), input1.end(), -static_cast<int>(VECTOR_LENGTH / 2));
  std::iota(input2.begin(), input2.end(), -static_cast<int>(VECTOR_LENGTH / 3));

  // The element type is passed explicitly: several element types share one
  // register type, so it cannot be deduced from the arguments.
  *output.template as<vec_t>() =
      kernels::multiply<Type_>(*input1.template as<vec_t>(), *input2.template as<vec_t>());

  // Unsigned index: `auto i = 0` deduced int and was compared against the
  // container size, mixing signed and unsigned operands.
  for (std::size_t i = 0; i < output.size(); ++i)
    CHECK(output[i] == Type_(input1[i] * input2[i]));
}

// Explicit instantiations, one per (instruction set, element type) pair.
// NOTE(review): the INTGEMM_* macros presumably expand to per-function target
// attributes -- confirm in the project headers.

// ---- SSE2 ----
template INTGEMM_SSE2 void kernel_multiply_test<CPUType::SSE2, int8_t>();
template INTGEMM_SSE2 void kernel_multiply_test<CPUType::SSE2, int16_t>();
template INTGEMM_SSE2 void kernel_multiply_test<CPUType::SSE2, int>();
template INTGEMM_SSE2 void kernel_multiply_test<CPUType::SSE2, float>();
template INTGEMM_SSE2 void kernel_multiply_test<CPUType::SSE2, double>();
KERNEL_TEST_CASE("multiply/int8 SSE2") { return kernel_multiply_test<CPUType::SSE2, int8_t>(); }
KERNEL_TEST_CASE("multiply/int16 SSE2") { return kernel_multiply_test<CPUType::SSE2, int16_t>(); }
KERNEL_TEST_CASE("multiply/int SSE2") { return kernel_multiply_test<CPUType::SSE2, int>(); }
KERNEL_TEST_CASE("multiply/float SSE2") { return kernel_multiply_test<CPUType::SSE2, float>(); }
KERNEL_TEST_CASE("multiply/double SSE2") { return kernel_multiply_test<CPUType::SSE2, double>(); }

// ---- AVX2 ----
template INTGEMM_AVX2 void kernel_multiply_test<CPUType::AVX2, int8_t>();
template INTGEMM_AVX2 void kernel_multiply_test<CPUType::AVX2, int16_t>();
template INTGEMM_AVX2 void kernel_multiply_test<CPUType::AVX2, int>();
template INTGEMM_AVX2 void kernel_multiply_test<CPUType::AVX2, float>();
template INTGEMM_AVX2 void kernel_multiply_test<CPUType::AVX2, double>();
KERNEL_TEST_CASE("multiply/int8 AVX2") { return kernel_multiply_test<CPUType::AVX2, int8_t>(); }
KERNEL_TEST_CASE("multiply/int16 AVX2") { return kernel_multiply_test<CPUType::AVX2, int16_t>(); }
KERNEL_TEST_CASE("multiply/int AVX2") { return kernel_multiply_test<CPUType::AVX2, int>(); }
KERNEL_TEST_CASE("multiply/float AVX2") { return kernel_multiply_test<CPUType::AVX2, float>(); }
KERNEL_TEST_CASE("multiply/double AVX2") { return kernel_multiply_test<CPUType::AVX2, double>(); }

// ---- AVX512BW (only when the compiler can target it) ----
#ifdef INTGEMM_COMPILER_SUPPORTS_AVX512
template INTGEMM_AVX512BW void kernel_multiply_test<CPUType::AVX512BW, int8_t>();
template INTGEMM_AVX512BW void kernel_multiply_test<CPUType::AVX512BW, int16_t>();
template INTGEMM_AVX512BW void kernel_multiply_test<CPUType::AVX512BW, int>();
template INTGEMM_AVX512BW void kernel_multiply_test<CPUType::AVX512BW, float>();
template INTGEMM_AVX512BW void kernel_multiply_test<CPUType::AVX512BW, double>();
KERNEL_TEST_CASE("multiply/int8 AVX512BW") { return kernel_multiply_test<CPUType::AVX512BW, int8_t>(); }
KERNEL_TEST_CASE("multiply/int16 AVX512BW") { return kernel_multiply_test<CPUType::AVX512BW, int16_t>(); }
KERNEL_TEST_CASE("multiply/int AVX512BW") { return kernel_multiply_test<CPUType::AVX512BW, int>(); }
KERNEL_TEST_CASE("multiply/float AVX512BW") { return kernel_multiply_test<CPUType::AVX512BW, float>(); }
KERNEL_TEST_CASE("multiply/double AVX512BW") { return kernel_multiply_test<CPUType::AVX512BW, double>(); }
#endif

}