diff options
author | Nikolay Bogoychev <nheart@gmail.com> | 2019-05-29 19:37:11 +0300 |
---|---|---|
committer | Nikolay Bogoychev <nheart@gmail.com> | 2019-05-29 19:37:11 +0300 |
commit | 0d01e603b92ee948232316cda7f0149e81666537 (patch) | |
tree | 6d7a9c60c18031ca2da0e195d013ffd1820c2c5b /multiply.h | |
parent | be86198e1b08b1b8098393814d77fc307c59006e (diff) | |
parent | 35dbeec838da533262fc5947dfa82aed58a50653 (diff) |
merge with master
Diffstat (limited to 'multiply.h')
-rw-r--r-- | multiply.h | 8 |
1 file changed, 4 insertions, 4 deletions
@@ -135,9 +135,9 @@ INTGEMM_PACK0123(INTGEMM_AVX512BW, __m512i) const int simd_width = width / (sizeof(Integer) / sizeof(int16_t)); \ typename WriteC::WriteCSubType write_C(C); \ const Integer *B0_col = reinterpret_cast<const Integer *>(B); \ - for (int B0_colidx = 0; B0_colidx < B_cols; B0_col += 8 * simd_width, B0_colidx += 8) { \ + for (Index B0_colidx = 0; B0_colidx < B_cols; B0_col += 8 * simd_width, B0_colidx += 8) { \ /* Process one row of A at a time. Doesn't seem to be faster to do multiple rows of A at once.*/ \ - for (int A_rowidx = 0; A_rowidx < A_rows; ++A_rowidx) { \ + for (Index A_rowidx = 0; A_rowidx < A_rows; ++A_rowidx) { \ const Integer *A_row = reinterpret_cast<const Integer*>(A + A_rowidx * width); \ /* These will be packed 32-bit integers containing sums for each row of B multiplied by the row of A. \ Iterate over shared (inner) dimension.*/ \ @@ -340,9 +340,9 @@ template <class WriteC> target static void Multiply(const int8_t *A, const int8_ const Integer *B0_col = reinterpret_cast<const Integer*>(B); \ typename WriteC::WriteCSubType c_writer(C); \ /*Go over 8 columns of B at a time.*/ \ - for (int B0_colidx = 0; B0_colidx != B_cols; B0_col += 8 * simd_width, B0_colidx += 8) { \ + for (Index B0_colidx = 0; B0_colidx != B_cols; B0_col += 8 * simd_width, B0_colidx += 8) { \ /*Process one row of A at a time. Doesn't seem to be faster to do multiple rows of A at once.*/ \ - for (int A_rowidx = 0; A_rowidx < A_rows; ++A_rowidx) { \ + for (Index A_rowidx = 0; A_rowidx < A_rows; ++A_rowidx) { \ /*Iterate over shared (inner) dimension.*/ \ const Integer *A_live = reinterpret_cast<const Integer *>(A + A_rowidx * width); \ const Integer *A_end = A_live + simd_width; \ |