Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/FBGEMM.git - Unnamed repository; edit this file 'description' to name the repository.
summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
Diffstat (limited to 'src/GenerateKernel.h')
-rw-r--r--src/GenerateKernel.h13
1 files changed, 12 insertions, 1 deletions
diff --git a/src/GenerateKernel.h b/src/GenerateKernel.h
index 7c0368b..7d8ac05 100644
--- a/src/GenerateKernel.h
+++ b/src/GenerateKernel.h
@@ -59,7 +59,15 @@ class CodeGenBase {
x86::zmm15, x86::zmm16, x86::zmm17, x86::zmm18, x86::zmm19,
x86::zmm20, x86::zmm21, x86::zmm22, x86::zmm23, x86::zmm24,
x86::zmm25, x86::zmm26, x86::zmm27,
- } {
+ },
+ AllRegs_avx512_{x86::zmm0, x86::zmm1, x86::zmm2, x86::zmm3,
+ x86::zmm4, x86::zmm5, x86::zmm6, x86::zmm7,
+ x86::zmm8, x86::zmm9, x86::zmm10, x86::zmm11,
+ x86::zmm12, x86::zmm13, x86::zmm14, x86::zmm15,
+ x86::zmm16, x86::zmm17, x86::zmm18, x86::zmm19,
+ x86::zmm20, x86::zmm21, x86::zmm22, x86::zmm23,
+ x86::zmm24, x86::zmm25, x86::zmm26, x86::zmm27,
+ x86::zmm28, x86::zmm29, x86::zmm30, x86::zmm31} {
// vector width in bits
if (cpuinfo_initialize()) {
if (fbgemmHasAvx512Support()) {
@@ -159,6 +167,9 @@ class CodeGenBase {
CRegs_avx2_[12]; ///< AVX2 ymm registers for C in the micro-kernel.
asmjit::X86Zmm
CRegs_avx512_[28]; ///< AVX512 zmm registers for C in the micro-kernel.
+ asmjit::X86Zmm
+ AllRegs_avx512_[32]; ///< all AVX512 zmm registers.
+
int vectorWidth_; ///< Vector width in bits.
int VLEN_; ///< Vector width in elements.
static thread_local asmjit::JitRuntime rt_; ///< JIT Runtime for asmjit.