/*
* Copyright (c) Facebook, Inc. and its affiliates.
* All rights reserved.
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree.
*/
#include "TestUtils.h"
#include <gtest/gtest.h>
#include "fbgemm/Fbgemm.h"
#include "bench/AlignedVec.h"
namespace fbgemm2 {
/**
 * @brief Element-wise comparison of a reference buffer against a test buffer.
 *
 * Walks an m x n window of both buffers, addressing element (i, j) as
 * `i * ld + j`. Every mismatch is reported through a gtest EXPECT_* macro;
 * the function itself never signals failure through its return value.
 *
 * @param ref  Buffer holding the expected values.
 * @param test Buffer holding the values under test.
 * @param m    Number of rows to compare.
 * @param n    Number of columns to compare.
 * @param ld   Stride (in elements) between consecutive rows of both buffers.
 * @param atol Largest accepted absolute difference; only consulted when T is
 *             not an integral type (integral types must match exactly).
 * @return Always 0.
 */
template <typename T>
int compare_validate_buffers(
    const T* ref,
    const T* test,
    int m,
    int n,
    int ld,
    T atol) {
  // Integral element types are compared for exact equality, everything else
  // is compared against the absolute tolerance.
  const bool exact_match = std::is_integral<T>::value;

  for (int i = 0; i < m; ++i) {
    for (int j = 0; j < n; ++j) {
      if (!exact_match) {
        EXPECT_LE(std::abs(ref[i * ld + j] - test[i * ld + j]), atol)
            << "GEMM results differ at (" << i << ", " << j
            << ") reference: " << ref[i * ld + j]
            << ", FBGEMM: " << test[i * ld + j];
        continue;
      }

      // Widen to int64_t for printing so that 8-bit values show up as
      // numbers rather than characters.
      EXPECT_EQ(ref[i * ld + j], test[i * ld + j])
          << "GEMM results differ at (" << i << ", " << j
          << ") reference: " << static_cast<int64_t>(ref[i * ld + j])
          << ", FBGEMM: " << static_cast<int64_t>(test[i * ld + j]);
    }
  }

  return 0;
}

// Explicit instantiations for the element types used by the tests.
template int compare_validate_buffers<float>(
    const float* ref,
    const float* test,
    int m,
    int n,
    int ld,
    float atol);

template int compare_validate_buffers<int32_t>(
    const int32_t* ref,
    const int32_t* test,
    int m,
    int n,
    int ld,
    int32_t atol);

template int compare_validate_buffers<uint8_t>(
    const uint8_t* ref,
    const uint8_t* test,
    int m,
    int n,
    int ld,
    uint8_t atol);
/**
 * @brief Scan a densely packed m x n buffer for a non-zero entry.
 *
 * Note the polarity: despite the name, the result is `true` as soon as ANY
 * entry differs from zero and `false` when every entry is zero (or when
 * there is nothing to scan).
 *
 * @param test Buffer of m * n contiguous elements (row stride equals n).
 * @param m    Number of rows.
 * @param n    Number of columns.
 * @return true if at least one entry is non-zero, false otherwise.
 */
template <typename T>
bool check_all_zero_entries(const T* test, int m, int n) {
  // Nothing to inspect when either dimension is empty or negative.
  if (m <= 0 || n <= 0) {
    return false;
  }

  // Rows are contiguous, so the matrix can be scanned as one flat range.
  const long long count = static_cast<long long>(m) * n;
  for (long long pos = 0; pos < count; ++pos) {
    if (test[pos] != 0) {
      return true;
    }
  }
  return false;
}

// Explicit instantiations for the element types used by the tests.
template bool check_all_zero_entries<float>(const float* test, int m, int n);
template bool
check_all_zero_entries<int32_t>(const int32_t* test, int m, int n);
template bool
check_all_zero_entries<uint8_t>(const uint8_t* test, int m, int n);
template <typename T>
void transpose_matrix(T* ref, int n, int k) {
aligned_vector<T> local(n * k, 0);
for (int i = 0; i < n; ++i) {
for (int j = 0; j < k; ++j) {
local[j * n + i] = ref[i * k + j];
}
}
for (int i = 0; i < k; ++i) {
for (int j = 0; j < n; ++j) {
ref[i * n + j] = local[i * n + j];
}
}
}
template void transpose_matrix<float>(float* ref, int n, int k);
template void transpose_matrix<int32_t>(int32_t* ref, int n, int k);
template void transpose_matrix<uint8_t>(uint8_t* ref, int n, int k);
template void transpose_matrix<int8_t>(int8_t* ref, int n, int k);
} // namespace fbgemm2