Welcome to mirror list, hosted at ThFree Co, Russian Federation.

github.com/marian-nmt/FBGEMM.git - Unnamed repository; edit this file 'description' to name the repository.
summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
-rw-r--r-- CMakeLists.txt 12
-rw-r--r-- include/fbgemm/Fbgemm.h 1
-rw-r--r-- src/FbgemmFP16.cc 2
-rw-r--r-- src/FbgemmFP16UKernelsAvx2.cc (renamed from src/FbgemmFP16UKernels.cc) 2
-rw-r--r-- src/FbgemmFP16UKernelsAvx2.h (renamed from src/FbgemmFP16UKernels.h) 2
-rw-r--r-- src/GenerateKernelU8S8S32ACC16Avx512.cc (renamed from src/GenerateKernelU8S8S32ACC16_avx512.cc) 0
-rw-r--r-- src/GenerateKernelU8S8S32ACC32Avx512.cc (renamed from src/GenerateKernelU8S8S32ACC32_avx512.cc) 0
-rw-r--r-- src/UtilsAvx2.cc (renamed from src/Utils_avx2.cc) 0
-rw-r--r-- src/UtilsAvx512.cc (renamed from src/Utils_avx512.cc) 0
-rw-r--r-- src/codegen_fp16fp32.cc 8
10 files changed, 10 insertions, 17 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt
index cda86b1..5d889cd 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -29,12 +29,11 @@ set(FBGEMM_GENERIC_SRCS src/ExecuteKernel.cc
src/ExecuteKernelU8S8.cc
src/Fbgemm.cc
src/FbgemmFP16.cc
- src/FbgemmFP16UKernels.cc
src/FbgemmI8Spmdm.cc
src/GenerateKernelU8S8S32ACC16.cc
- src/GenerateKernelU8S8S32ACC16_avx512.cc
+ src/GenerateKernelU8S8S32ACC16Avx512.cc
src/GenerateKernelU8S8S32ACC32.cc
- src/GenerateKernelU8S8S32ACC32_avx512.cc
+ src/GenerateKernelU8S8S32ACC32Avx512.cc
src/PackAMatrix.cc
src/PackAWithIm2Col.cc
src/PackBMatrix.cc
@@ -64,13 +63,14 @@ endif()
#All the source files that either use avx2 instructions statically
set(FBGEMM_AVX2_SRCS
+ src/FbgemmFP16UKernelsAvx2.cc
src/FbgemmI8DepthwiseAvx2.cc
src/OptimizedKernelsAvx2.cc
src/QuantUtilsAvx2.cc
- src/Utils_avx2.cc)
+ src/UtilsAvx2.cc)
#All the source files that use avx512 instructions statically
-set(FBGEMM_AVX512_SRCS src/Utils_avx512.cc)
+set(FBGEMM_AVX512_SRCS src/UtilsAvx512.cc)
set(FBGEMM_PUBLIC_HEADERS include/fbgemm/Fbgemm.h
include/fbgemm/OutputProcessing-inl.h
@@ -93,8 +93,6 @@ set_target_properties(fbgemm_generic fbgemm_avx2 fbgemm_avx512 PROPERTIES
CXX_EXTENSIONS NO
CXX_VISIBILITY_PRESET hidden)
-target_compile_options(fbgemm_generic PRIVATE
- "-m64" "-mavx2" "-mfma" "-masm=intel")
target_compile_options(fbgemm_avx2 PRIVATE
"-m64" "-mavx2" "-mfma" "-masm=intel")
target_compile_options(fbgemm_avx512 PRIVATE
diff --git a/include/fbgemm/Fbgemm.h b/include/fbgemm/Fbgemm.h
index c54bf24..5fedd28 100644
--- a/include/fbgemm/Fbgemm.h
+++ b/include/fbgemm/Fbgemm.h
@@ -9,7 +9,6 @@
/**
* Top level include file for FBGEMM.
*/
-#include <immintrin.h>
#include <cassert>
#include <cmath>
#include <limits>
diff --git a/src/FbgemmFP16.cc b/src/FbgemmFP16.cc
index 6d44c74..2af1f89 100644
--- a/src/FbgemmFP16.cc
+++ b/src/FbgemmFP16.cc
@@ -10,7 +10,7 @@
#include <array>
#include <utility>
-#include "FbgemmFP16UKernels.h"
+#include "FbgemmFP16UKernelsAvx2.h"
using namespace std;
diff --git a/src/FbgemmFP16UKernels.cc b/src/FbgemmFP16UKernelsAvx2.cc
index d915765..8a0cb0d 100644
--- a/src/FbgemmFP16UKernels.cc
+++ b/src/FbgemmFP16UKernelsAvx2.cc
@@ -4,7 +4,7 @@
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree.
*/
-#include "FbgemmFP16UKernels.h"
+#include "FbgemmFP16UKernelsAvx2.h"
namespace fbgemm {
diff --git a/src/FbgemmFP16UKernels.h b/src/FbgemmFP16UKernelsAvx2.h
index d35d431..4053332 100644
--- a/src/FbgemmFP16UKernels.h
+++ b/src/FbgemmFP16UKernelsAvx2.h
@@ -7,8 +7,6 @@
#ifndef FBGEMM_UKERNELS
#define FBGEMM_UKERNELS
#include <cstdint>
-#include <tuple>
-#include <vector>
#include "fbgemm/Types.h"
namespace fbgemm {
diff --git a/src/GenerateKernelU8S8S32ACC16_avx512.cc b/src/GenerateKernelU8S8S32ACC16Avx512.cc
index eeeaea0..eeeaea0 100644
--- a/src/GenerateKernelU8S8S32ACC16_avx512.cc
+++ b/src/GenerateKernelU8S8S32ACC16Avx512.cc
diff --git a/src/GenerateKernelU8S8S32ACC32_avx512.cc b/src/GenerateKernelU8S8S32ACC32Avx512.cc
index 0621bb0..0621bb0 100644
--- a/src/GenerateKernelU8S8S32ACC32_avx512.cc
+++ b/src/GenerateKernelU8S8S32ACC32Avx512.cc
diff --git a/src/Utils_avx2.cc b/src/UtilsAvx2.cc
index badf70b..badf70b 100644
--- a/src/Utils_avx2.cc
+++ b/src/UtilsAvx2.cc
diff --git a/src/Utils_avx512.cc b/src/UtilsAvx512.cc
index f49bb6f..f49bb6f 100644
--- a/src/Utils_avx512.cc
+++ b/src/UtilsAvx512.cc
diff --git a/src/codegen_fp16fp32.cc b/src/codegen_fp16fp32.cc
index 8dd3166..17bb113 100644
--- a/src/codegen_fp16fp32.cc
+++ b/src/codegen_fp16fp32.cc
@@ -65,7 +65,7 @@ int main() {
// open all files
ofstream srcfile;
- srcfile.open("FbgemmFP16UKernels.cc");
+ srcfile.open("FbgemmFP16UKernelsAvx2.cc");
srcfile
<< "/*\n"
" * Copyright (c) Facebook, Inc. and its affiliates.\n"
@@ -73,14 +73,14 @@ int main() {
" * This source code is licensed under the BSD-style license found in the\n"
" * LICENSE file in the root directory of this source tree.\n"
" */\n";
- srcfile << "#include \"FbgemmFP16UKernels.h\"\n\n";
+ srcfile << "#include \"FbgemmFP16UKernelsAvx2.h\"\n\n";
srcfile << "namespace fbgemm {\n\n";
if (iaca) {
srcfile << "#include \"iacaMarks.h\"\n";
}
ofstream hdrfile;
- hdrfile.open("FbgemmFP16UKernels.h");
+ hdrfile.open("FbgemmFP16UKernelsAvx2.h");
hdrfile
<< "/*\n"
" * Copyright (c) Facebook, Inc. and its affiliates.\n"
@@ -92,8 +92,6 @@ int main() {
hdrfile << "#ifndef FBGEMM_UKERNELS\n";
hdrfile << "#define FBGEMM_UKERNELS\n";
hdrfile << "#include <cstdint>\n";
- hdrfile << "#include <tuple>\n";
- hdrfile << "#include <vector>\n";
hdrfile << "#include \"fbgemm/Types.h\"\n\n";
hdrfile << "namespace fbgemm {\n\n";
hdrfile << "using fp16 = float16;\n";