Welcome to the mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/intgemm.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Kenneth Heafield <github@kheafield.com> 2018-07-01 01:52:41 +0300
committer: Kenneth Heafield <github@kheafield.com> 2018-07-01 01:52:41 +0300
commit: 93e1c884fb351a52e94700fd8793c2bb395194fb (patch)
tree: baaabac11b46e83c216617017c02e8382357f6ae
parent: 7bd7cba6c0cc29d16d2fef5272164a65e0099871 (diff)
parent: 96f35bbbc99a91aac85005b7a35e5d0605fa6e32 (diff)
Merge branch 'master' of github.com:kpu/intgemm
-rw-r--r-- multiply_test.cc 10
1 file changed, 6 insertions, 4 deletions
diff --git a/multiply_test.cc b/multiply_test.cc
index 236bca5..1700399 100644
--- a/multiply_test.cc
+++ b/multiply_test.cc
@@ -135,7 +135,7 @@ template <class Routine> void TestSelectColumnsB(int rows = 32, int cols = 16) {
AlignedVector<Integer> prepared(rows * cols);
Routine::PrepareB(input.get(), prepared.get(), 1, rows, cols);
- int kSelectCols = 8;
+ int kSelectCols = 24;
std::size_t select_cols[kSelectCols];
for (int i = 0; i < kSelectCols; ++i) {
select_cols[i] = rand() % cols;
@@ -326,19 +326,21 @@ int main(int argc, char ** argv) {
TestPrepare<AVX512_16bit>(32, 8);
TestPrepare<AVX512_16bit>(256, 32);
TestSelectColumnsB<AVX512_8bit>();
- TestSelectColumnsB<AVX512_16bit>();
+ TestSelectColumnsB<AVX512_16bit>(256, 256);
#endif
TestPrepare<AVX2_8bit>(64, 32);
TestPrepare<AVX2_16bit>(64, 32);
- TestSelectColumnsB<AVX2_8bit>();
- TestSelectColumnsB<AVX2_16bit>();
+ TestSelectColumnsB<AVX2_8bit>(256, 256);
+ TestSelectColumnsB<AVX2_16bit>(256, 256);
TestPrepare<SSSE3_8bit>(16, 8);
TestPrepare<SSSE3_8bit>(32, 16);
TestPrepare<SSSE3_8bit>(32, 32);
TestSelectColumnsB<SSSE3_8bit>();
+ TestSelectColumnsB<SSSE3_8bit>(256, 256);
TestPrepare<SSE2_16bit>(8, 8);
TestPrepare<SSE2_16bit>(32, 32);
TestSelectColumnsB<SSE2_16bit>();
+ TestSelectColumnsB<SSE2_16bit>(256, 256);
TestMax<__m128>();
TestMaxAbsolute<SSE2_MaxAbsolute>();
/* if (kCPU >= CPU_AVX2) {