diff options
Diffstat (limited to 'src/FbgemmFP16UKernels.h')
-rw-r--r-- | src/FbgemmFP16UKernels.h | 40 |
1 files changed, 40 insertions, 0 deletions
diff --git a/src/FbgemmFP16UKernels.h b/src/FbgemmFP16UKernels.h new file mode 100644 index 0000000..bf7f247 --- /dev/null +++ b/src/FbgemmFP16UKernels.h @@ -0,0 +1,40 @@ +/* + * Copyright (c) Facebook, Inc. and its affiliates. + * All rights reserved. + * This source code is licensed under the BSD-style license found in the + * LICENSE file in the root directory of this source tree. + */ +#ifndef FBGEMM_UKERNELS +#define FBGEMM_UKERNELS +#include <cstdint> +#include <tuple> +#include <vector> +#include "fbgemm/Types.h" + +namespace fbgemm2 { + +using fp16 = float16; +using fp32 = float; +struct GemmParams {uint64_t k; float *A; const fp16 *B; +float *beta; uint64_t accum; float *C; uint64_t ldc; +uint64_t b_block_cols; uint64_t b_block_size;}; +void __attribute__ ((noinline)) gemmkernel_1x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_2x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_3x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_4x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_5x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_6x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_7x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_8x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_9x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_10x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_11x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_12x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_13x1_AVX2_fA0fB0fC0(GemmParams *gp); +void __attribute__ ((noinline)) gemmkernel_14x1_AVX2_fA0fB0fC0(GemmParams *gp); +typedef void (* funcptr_fp16) (GemmParams *gp); +; + +} // namespace fbgemm2 + +#endif |