Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/intgemm.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
Diffstat (limited to 'ssse3_gemm.h')
-rw-r--r-- ssse3_gemm.h 13
1 files changed, 3 insertions, 10 deletions
diff --git a/ssse3_gemm.h b/ssse3_gemm.h
index 9c21467..4e12b90 100644
--- a/ssse3_gemm.h
+++ b/ssse3_gemm.h
@@ -88,21 +88,14 @@ struct SSSE3_8bit {
// Tile size for B; B must be a multiple of this block size.
static const Index kBTileRow = 16;
static const Index kBTileCol = 8;
-/*
- INTGEMM_SSSE3 static void PrepareB(const float *input, int8_t *output, float quant_mult, Index rows, Index cols) {
- PrepareBFor8(input, output, ssse3::QuantizeTile8(quant_mult), rows, cols);
- }*/
+
INTGEMM_PREPARE_B_8(INTGEMM_SSSE3, ssse3::QuantizeTile8)
INTGEMM_SSSE3 static void SelectColumnsB(const int8_t *input, int8_t *output, Index rows, const Index *cols_begin, const Index *cols_end) {
ssse3::SelectColumnsOfB((const __m128i*)input, (__m128i*)output, rows, cols_begin, cols_end);
}
-/*
- INTGEMM_SSSE3 static void Multiply(const int8_t *A, const int8_t *B, float *C, float unquant_mult, Index A_rows, Index width, Index B_cols) {
- //Multiply8_SSE2OrAVX2<Multiply8_C, __m128i, __m128>(A, B, C, unquant_mult, A_rows, width, B_cols);
- Multiply8_SSE2OrAVX2__m128i<JustUnquantizeC>(A, B, JustUnquantizeC(C, unquant_mult), A_rows, width, B_cols);
- }*/
- INTGEMM_MULTIPLY8(__m128i, INTGEMM_SSSE3, OnSSE2)
+
+ INTGEMM_MULTIPLY8(__m128i, INTGEMM_SSSE3, CPUType::CPU_SSE2)
constexpr static const char *const kName = "8-bit INTGEMM_SSSE3";