diff options
Diffstat (limited to 'ssse3_gemm.h')
-rw-r--r-- | ssse3_gemm.h | 13 |
1 files changed, 3 insertions, 10 deletions
diff --git a/ssse3_gemm.h b/ssse3_gemm.h
index 9c21467..4e12b90 100644
--- a/ssse3_gemm.h
+++ b/ssse3_gemm.h
@@ -88,21 +88,14 @@ struct SSSE3_8bit {
   // Tile size for B; B must be a multiple of this block size.
   static const Index kBTileRow = 16;
   static const Index kBTileCol = 8;
-/*
-  INTGEMM_SSSE3 static void PrepareB(const float *input, int8_t *output, float quant_mult, Index rows, Index cols) {
-    PrepareBFor8(input, output, ssse3::QuantizeTile8(quant_mult), rows, cols);
-  }*/
+
   INTGEMM_PREPARE_B_8(INTGEMM_SSSE3, ssse3::QuantizeTile8)
 
   INTGEMM_SSSE3 static void SelectColumnsB(const int8_t *input, int8_t *output, Index rows, const Index *cols_begin, const Index *cols_end) {
     ssse3::SelectColumnsOfB((const __m128i*)input, (__m128i*)output, rows, cols_begin, cols_end);
   }
-/*
-  INTGEMM_SSSE3 static void Multiply(const int8_t *A, const int8_t *B, float *C, float unquant_mult, Index A_rows, Index width, Index B_cols) {
-    //Multiply8_SSE2OrAVX2<Multiply8_C, __m128i, __m128>(A, B, C, unquant_mult, A_rows, width, B_cols);
-    Multiply8_SSE2OrAVX2__m128i<JustUnquantizeC>(A, B, JustUnquantizeC(C, unquant_mult), A_rows, width, B_cols);
-  }*/
-  INTGEMM_MULTIPLY8(__m128i, INTGEMM_SSSE3, OnSSE2)
+
+  INTGEMM_MULTIPLY8(__m128i, INTGEMM_SSSE3, CPUType::CPU_SSE2)
 
   constexpr static const char *const kName = "8-bit INTGEMM_SSSE3";
 