diff options
Diffstat (limited to 'ssse3_gemm.h')
-rw-r--r-- | ssse3_gemm.h | 4 |
1 files changed, 4 insertions, 0 deletions
diff --git a/ssse3_gemm.h b/ssse3_gemm.h index fd3ab8c..5841541 100644 --- a/ssse3_gemm.h +++ b/ssse3_gemm.h @@ -20,6 +20,7 @@ INTGEMM_SSSE3 inline __m128i QuantizerGrab(const float *input, const __m128 quan } INTGEMM_SELECT_COL_B(INTGEMM_SSSE3, __m128i) +INTGEMM_SELECT_COL_B_COLUMN_MAJOR(INTGEMM_SSSE3, __m128i) class QuantizeTile8 { public: @@ -149,6 +150,9 @@ struct SSSE3_8bit { INTGEMM_SSSE3 static void SelectColumnsB(const int8_t *input, int8_t *output, Index rows, const Index *cols_begin, const Index *cols_end) { ssse3::SelectColumnsOfB((const __m128i*)input, (__m128i*)output, rows, cols_begin, cols_end); } + INTGEMM_SSSE3 static void SelectColumnsB_ColumnsMajor(const int8_t *input, int8_t *output, Index rows, const Index *cols_begin, const Index *cols_end) { + ssse3::SelectColumnsOfB_ColumnMajor((const __m128i*)input, (__m128i*)output, rows, cols_begin, cols_end); + } INTGEMM_MULTIPLY8(__m128i, INTGEMM_SSSE3, CPUType::SSE2) |