From edf247fb1c632a0c4487207a51151bd1f7f8aef5 Mon Sep 17 00:00:00 2001 From: Hans-Kristian Arntzen Date: Mon, 25 Oct 2021 10:55:11 +0200 Subject: MSL: Workaround compiler crashes when using threadgroup bool. Promote to short instead and do simple casts on load/store instead. Not 100% complete fix since structs can contain booleans, but this is getting into pretty ridiculously complicated territory. --- .../comp/threadgroup-boolean-workaround.comp | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) create mode 100644 reference/opt/shaders-msl/comp/threadgroup-boolean-workaround.comp (limited to 'reference/opt/shaders-msl') diff --git a/reference/opt/shaders-msl/comp/threadgroup-boolean-workaround.comp b/reference/opt/shaders-msl/comp/threadgroup-boolean-workaround.comp new file mode 100644 index 00000000..8b80929a --- /dev/null +++ b/reference/opt/shaders-msl/comp/threadgroup-boolean-workaround.comp @@ -0,0 +1,20 @@ +#include +#include + +using namespace metal; + +struct SSBO +{ + float4 values[1]; +}; + +constant uint3 gl_WorkGroupSize [[maybe_unused]] = uint3(4u, 1u, 1u); + +kernel void main0(device SSBO& _23 [[buffer(0)]], uint gl_LocalInvocationIndex [[thread_index_in_threadgroup]], uint3 gl_GlobalInvocationID [[thread_position_in_grid]]) +{ + threadgroup short4 foo[4]; + foo[gl_LocalInvocationIndex] = short4((isunordered(_23.values[gl_GlobalInvocationID.x], float4(10.0)) || _23.values[gl_GlobalInvocationID.x] != float4(10.0))); + threadgroup_barrier(mem_flags::mem_threadgroup); + _23.values[gl_GlobalInvocationID.x] = select(float4(40.0), float4(30.0), bool4(foo[gl_LocalInvocationIndex ^ 3u])); +} + -- cgit v1.2.3