Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/FBGEMM.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Jianyu Huang <jianyuhuang@fb.com>, 2018-11-08 22:09:04 +0300
committer: Jianyu Huang <jianyuhuang@fb.com>, 2018-11-08 22:09:04 +0300
commit: 428a0b6cede232eb5c4e9c3bbd8e9d74d8e34500 (patch)
tree: 8597c3316e00e00fa5d0fc8939c9ae5c518f767a /src/ExecuteKernelU8S8.cc
parent: d90e2e1659f9f991319d05bfc58640aeafa733aa (diff)
Sync with internal copy: Asymmetric padding; fbgemm2 -> fbgemm
Diffstat (limited to 'src/ExecuteKernelU8S8.cc')
-rw-r--r-- src/ExecuteKernelU8S8.cc | 28
1 files changed, 26 insertions, 2 deletions
diff --git a/src/ExecuteKernelU8S8.cc b/src/ExecuteKernelU8S8.cc
index e091a87..b3f8c15 100644
--- a/src/ExecuteKernelU8S8.cc
+++ b/src/ExecuteKernelU8S8.cc
@@ -14,7 +14,7 @@ double kernel_time = 0.0;
double postprocessing_time = 0.0;
#endif
-namespace fbgemm2 {
+namespace fbgemm {
template <typename packingAMatrix, typename cT, typename processOutputType>
ExecuteKernel<
@@ -328,6 +328,18 @@ template class ExecuteKernel<
memCopy<>>;
template class ExecuteKernel<
+ PackAWithIm2Col<uint8_t, int16_t>,
+ PackBMatrix<int8_t, int16_t>,
+ uint8_t,
+ ReQuantizeOutput<false>>;
+
+template class ExecuteKernel<
+ PackAWithIm2Col<uint8_t, int16_t, 3>,
+ PackBMatrix<int8_t, int16_t>,
+ uint8_t,
+ ReQuantizeOutput<false>>;
+
+template class ExecuteKernel<
PackAWithRowOffset<uint8_t, int32_t>,
PackBMatrix<int8_t, int32_t>,
int32_t,
@@ -346,6 +358,18 @@ template class ExecuteKernel<
memCopy<>>;
template class ExecuteKernel<
+ PackAWithIm2Col<uint8_t, int32_t>,
+ PackBMatrix<int8_t, int32_t>,
+ uint8_t,
+ ReQuantizeOutput<false>>;
+
+template class ExecuteKernel<
+ PackAWithIm2Col<uint8_t, int32_t, 3>,
+ PackBMatrix<int8_t, int32_t>,
+ uint8_t,
+ ReQuantizeOutput<false>>;
+
+template class ExecuteKernel<
PackAWithQuantRowOffset<uint8_t, int32_t>,
PackBMatrix<int8_t, int32_t>,
int32_t,
@@ -363,4 +387,4 @@ template class ExecuteKernel<
int32_t,
DoNothing<int32_t, int32_t>>;
-} // namespace fbgemm2
+} // namespace fbgemm