1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
|
#pragma clang diagnostic ignored "-Wmissing-prototypes"
#include <metal_stdlib>
#include <simd/simd.h>
using namespace metal;
// Multiplies l by r, expressed as a single fma with a zero addend
// (l * r + 0) instead of the plain `*` operator.
// NOTE(review): marked [[clang::optnone]], presumably so the compiler cannot
// rewrite or fuse this operation with neighbouring math - confirm against the
// generator that emitted this helper.
template<typename T>
[[clang::optnone]] T spvFMul(T l, T r)
{
    const T zeroAddend = T(0);
    return fma(l, r, zeroAddend);
}
// Row-vector times matrix: returns a Cols-component vector whose element j is
// the sum over i of v[i] * m[j][i], built from one vector fma per matrix row.
// Rows are accumulated from the highest index down to 0; that order is kept
// exactly because floating-point accumulation is order-sensitive.
template<typename T, int Cols, int Rows>
[[clang::optnone]] vec<T, Cols> spvFMulVectorMatrix(vec<T, Rows> v, matrix<T, Cols, Rows> m)
{
    vec<T, Cols> acc = vec<T, Cols>(0);
    uint row = Rows;
    while (row > 0)
    {
        --row;

        // m is indexed column-first, so gather row `row` element by element.
        vec<T, Cols> rowOfM(0);
        for (uint col = 0; col < Cols; ++col)
        {
            rowOfM[col] = m[col][row];
        }

        // acc += rowOfM * v[row], with v[row] broadcast to every lane.
        acc = fma(rowOfM, vec<T, Cols>(v[row]), acc);
    }
    return acc;
}
// Matrix times column-vector: returns a Rows-component vector equal to the sum
// over i of m[i] * v[i], where m[i] is the i-th column of m. One vector fma is
// issued per column.
// Columns are accumulated from the highest index down to 0; that order is kept
// exactly because floating-point accumulation is order-sensitive.
template<typename T, int Cols, int Rows>
[[clang::optnone]] vec<T, Rows> spvFMulMatrixVector(matrix<T, Cols, Rows> m, vec<T, Cols> v)
{
    vec<T, Rows> acc = vec<T, Rows>(0);
    uint col = Cols;
    while (col > 0)
    {
        --col;

        // Broadcast the scalar v[col] across all lanes, then acc += m[col] * v[col].
        const vec<T, Rows> weight = vec<T, Rows>(v[col]);
        acc = fma(m[col], weight, acc);
    }
    return acc;
}
// Matrix times matrix (l * r), built from vector fma operations.
//
// Column i of the result is the sum over j of l[j] * r[i][j], i.e. a linear
// combination of the columns of l weighted by the entries of column i of r.
// The result therefore has RCols columns, each with LRows components.
//
// The accumulator and the broadcast weight are typed vec<T, LRows> to match
// both l[j] and res[i]. Typing them as vec<T, RCols> only compiles when
// RCols == LRows, which breaks non-square products.
//
// NOTE(review): the inner loop reads r[i][j] for j < LCols, so callers are
// expected to pass LCols == RRows (the usual matrix-product constraint); this
// is not enforced here.
template<typename T, int LCols, int LRows, int RCols, int RRows>
[[clang::optnone]] matrix<T, RCols, LRows> spvFMulMatrixMatrix(matrix<T, LCols, LRows> l, matrix<T, RCols, RRows> r)
{
    matrix<T, RCols, LRows> res;
    for (uint i = 0; i < RCols; i++)
    {
        // Accumulates result column i; it has as many components as l has rows.
        vec<T, LRows> tmp(0);
        for (uint j = 0; j < LCols; j++)
        {
            // tmp += l[j] * r[i][j], with the scalar r[i][j] broadcast to all lanes.
            tmp = fma(vec<T, LRows>(r[i][j]), l[j], tmp);
        }
        res[i] = tmp;
    }
    return res;
}
// Adds l and r, expressed as a single fma with a unit multiplier
// (1 * l + r) instead of the plain `+` operator.
// NOTE(review): marked [[clang::optnone]], presumably so the compiler cannot
// rewrite or fuse this operation with neighbouring math - confirm against the
// generator that emitted this helper.
template<typename T>
[[clang::optnone]] T spvFAdd(T l, T r)
{
    const T unit = T(1);
    return fma(unit, l, r);
}
// Subtracts r from l, expressed as a single fma with a negative-one multiplier
// (-1 * r + l) instead of the plain `-` operator.
// NOTE(review): marked [[clang::optnone]], presumably so the compiler cannot
// rewrite or fuse this operation with neighbouring math - confirm against the
// generator that emitted this helper.
template<typename T>
[[clang::optnone]] T spvFSub(T l, T r)
{
    const T minusOne = T(-1);
    return fma(minusOne, r, l);
}
// Return type of the main0 vertex function.
struct main0_out
{
// Vertex position produced by main0; carries the [[position]] attribute.
float4 gl_Position [[position]];
};
// Per-vertex inputs of the main0 vertex function, which takes this struct as
// its [[stage_in]] parameter.
struct main0_in
{
// Three float4 inputs bound to vertex attribute indices 0, 1 and 2.
float4 vA [[attribute(0)]];
float4 vB [[attribute(1)]];
float4 vC [[attribute(2)]];
};
// Vertex entry point. Computes
//   gl_Position = (((vA * vB) + (vA + vB)) + (vA - vB)) + ((vA * vB) + vC)
// with every multiply, add and subtract routed through the spvFMul / spvFAdd /
// spvFSub helpers rather than the built-in operators. The product vA * vB is
// computed once and used in two places.
vertex main0_out main0(main0_in in [[stage_in]])
{
    // Leaf terms of the expression.
    const float4 product = spvFMul(in.vA, in.vB);
    const float4 sumAB = spvFAdd(in.vA, in.vB);
    const float4 diffAB = spvFSub(in.vA, in.vB);
    const float4 productPlusC = spvFAdd(product, in.vC);

    // Left-to-right accumulation, same association as the nested call form.
    float4 position = spvFAdd(product, sumAB);
    position = spvFAdd(position, diffAB);
    position = spvFAdd(position, productPlusC);

    main0_out out = {};
    out.gl_Position = position;
    return out;
}
|