Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/intgemm/intgemm.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Nikolay Bogoychev <nheart@gmail.com>, 2019-04-12 23:11:03 +0300
committer: Nikolay Bogoychev <nheart@gmail.com>, 2019-04-12 23:11:03 +0300
commit 627ab821c71606aa6ff4947640def78b4f2b192c (patch)
tree c8a9096dcc4e769529467c90336b412a7bf4b8b3 /ssse3_gemm.h
parent 6d7d1877554045a0b5e809a1f286c4a38bd98233 (diff)
Mostly working
Diffstat (limited to 'ssse3_gemm.h')
-rw-r--r-- ssse3_gemm.h 8
1 file changed, 5 insertions, 3 deletions
diff --git a/ssse3_gemm.h b/ssse3_gemm.h
index 69ac298..2b830a9 100644
--- a/ssse3_gemm.h
+++ b/ssse3_gemm.h
@@ -86,17 +86,19 @@ struct SSSE3_8bit {
// Tile size for B; B must be a multiple of this block size.
static const Index kBTileRow = 16;
static const Index kBTileCol = 8;
-
+/*
SSSE3 static void PrepareB(const float *input, int8_t *output, float quant_mult, Index rows, Index cols) {
PrepareBFor8(input, output, ssse3::QuantizeTile8(quant_mult), rows, cols);
- }
+ }*/
+ PREPARE_B_8_DEF(SSSE3, ssse3::QuantizeTile8)
SSSE3 static void SelectColumnsB(const int8_t *input, int8_t *output, Index rows, const Index *cols_begin, const Index *cols_end) {
SelectColumnsOfB((const __m128i*)input, (__m128i*)output, rows, cols_begin, cols_end);
}
SSSE3 static void Multiply(const int8_t *A, const int8_t *B, float *C, float unquant_mult, Index A_rows, Index width, Index B_cols) {
- Multiply8_SSE2OrAVX2<Multiply8_C, __m128i, __m128>(A, B, C, unquant_mult, A_rows, width, B_cols);
+ //Multiply8_SSE2OrAVX2<Multiply8_C, __m128i, __m128>(A, B, C, unquant_mult, A_rows, width, B_cols);
+ Multiply8_SSE2OrAVX2__m128i<Multiply8_C>(A, B, C, unquant_mult, A_rows, width, B_cols);
}
constexpr static const char *const kName = "8-bit SSSE3";