diff options
author | Kenneth Heafield <github@kheafield.com> | 2018-07-01 01:52:41 +0300 |
---|---|---|
committer | Kenneth Heafield <github@kheafield.com> | 2018-07-01 01:52:41 +0300 |
commit | 93e1c884fb351a52e94700fd8793c2bb395194fb (patch) | |
tree | baaabac11b46e83c216617017c02e8382357f6ae | |
parent | 7bd7cba6c0cc29d16d2fef5272164a65e0099871 (diff) | |
parent | 96f35bbbc99a91aac85005b7a35e5d0605fa6e32 (diff) |
Merge branch 'master' of github.com:kpu/intgemm
-rw-r--r-- | multiply_test.cc | 10 |
1 file changed, 6 insertions, 4 deletions
diff --git a/multiply_test.cc b/multiply_test.cc index 236bca5..1700399 100644 --- a/multiply_test.cc +++ b/multiply_test.cc @@ -135,7 +135,7 @@ template <class Routine> void TestSelectColumnsB(int rows = 32, int cols = 16) { AlignedVector<Integer> prepared(rows * cols); Routine::PrepareB(input.get(), prepared.get(), 1, rows, cols); - int kSelectCols = 8; + int kSelectCols = 24; std::size_t select_cols[kSelectCols]; for (int i = 0; i < kSelectCols; ++i) { select_cols[i] = rand() % cols; @@ -326,19 +326,21 @@ int main(int argc, char ** argv) { TestPrepare<AVX512_16bit>(32, 8); TestPrepare<AVX512_16bit>(256, 32); TestSelectColumnsB<AVX512_8bit>(); - TestSelectColumnsB<AVX512_16bit>(); + TestSelectColumnsB<AVX512_16bit>(256, 256); #endif TestPrepare<AVX2_8bit>(64, 32); TestPrepare<AVX2_16bit>(64, 32); - TestSelectColumnsB<AVX2_8bit>(); - TestSelectColumnsB<AVX2_16bit>(); + TestSelectColumnsB<AVX2_8bit>(256, 256); + TestSelectColumnsB<AVX2_16bit>(256, 256); TestPrepare<SSSE3_8bit>(16, 8); TestPrepare<SSSE3_8bit>(32, 16); TestPrepare<SSSE3_8bit>(32, 32); TestSelectColumnsB<SSSE3_8bit>(); + TestSelectColumnsB<SSSE3_8bit>(256, 256); TestPrepare<SSE2_16bit>(8, 8); TestPrepare<SSE2_16bit>(32, 32); TestSelectColumnsB<SSE2_16bit>(); + TestSelectColumnsB<SSE2_16bit>(256, 256); TestMax<__m128>(); TestMaxAbsolute<SSE2_MaxAbsolute>(); /* if (kCPU >= CPU_AVX2) { |