65 lines
3.4 KiB
GLSL
65 lines
3.4 KiB
GLSL
|
#pragma clang diagnostic ignored "-Wmissing-prototypes"
|
||
|
#pragma clang diagnostic ignored "-Wunused-variable"
|
||
|
|
||
|
#include <metal_stdlib>
|
||
|
#include <simd/simd.h>
|
||
|
#include <metal_atomic>
|
||
|
|
||
|
using namespace metal;
|
||
|
|
||
|
// The required alignment of a linear texture of R32Uint format.
|
||
|
constant uint spvLinearTextureAlignmentOverride [[function_constant(65535)]];
|
||
|
constant uint spvLinearTextureAlignment = is_function_constant_defined(spvLinearTextureAlignmentOverride) ? spvLinearTextureAlignmentOverride : 4;
|
||
|
// Returns buffer coords corresponding to 2D texture coords for emulating 2D texture atomics
|
||
|
#define spvImage2DAtomicCoord(tc, tex) (((((tex).get_width() + spvLinearTextureAlignment / 4 - 1) & ~( spvLinearTextureAlignment / 4 - 1)) * (tc).y) + (tc).x)
|
||
|
|
||
|
struct foo_t
|
||
|
{
|
||
|
float x;
|
||
|
uint y;
|
||
|
};
|
||
|
|
||
|
struct main0_out
|
||
|
{
|
||
|
float4 fragColor [[color(0)]];
|
||
|
};
|
||
|
|
||
|
fragment main0_out main0(device foo_t& foo [[buffer(0)]], texture2d<uint, access::write> bar [[texture(0)]], device atomic_uint* bar_atomic [[buffer(1)]], float4 gl_FragCoord [[position]])
|
||
|
{
|
||
|
main0_out out = {};
|
||
|
bool gl_HelperInvocation = {};
|
||
|
gl_HelperInvocation = simd_is_helper_thread();
|
||
|
if (!gl_HelperInvocation)
|
||
|
{
|
||
|
foo.x = 1.0;
|
||
|
}
|
||
|
uint _90 = (!gl_HelperInvocation ? atomic_exchange_explicit((device atomic_uint*)&foo.y, 0u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&foo.y, memory_order_relaxed));
|
||
|
if (int(gl_FragCoord.x) == 3)
|
||
|
{
|
||
|
gl_HelperInvocation = true, discard_fragment();
|
||
|
}
|
||
|
int2 _100 = int2(gl_FragCoord.xy);
|
||
|
(gl_HelperInvocation ? ((void)0) : bar.write(uint4(1u), uint2(_100)));
|
||
|
uint _102 = (!gl_HelperInvocation ? atomic_fetch_add_explicit((device atomic_uint*)&foo.y, 42u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&foo.y, memory_order_relaxed));
|
||
|
uint _107 = (!gl_HelperInvocation ? atomic_fetch_or_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], 62u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], memory_order_relaxed));
|
||
|
uint _109 = (!gl_HelperInvocation ? atomic_fetch_and_explicit((device atomic_uint*)&foo.y, 65535u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&foo.y, memory_order_relaxed));
|
||
|
uint _111 = (!gl_HelperInvocation ? atomic_fetch_xor_explicit((device atomic_uint*)&foo.y, 4294967040u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&foo.y, memory_order_relaxed));
|
||
|
uint _113 = (!gl_HelperInvocation ? atomic_fetch_min_explicit((device atomic_uint*)&foo.y, 1u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&foo.y, memory_order_relaxed));
|
||
|
uint _118 = (!gl_HelperInvocation ? atomic_fetch_max_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], 100u, memory_order_relaxed) : atomic_load_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], memory_order_relaxed));
|
||
|
uint _123;
|
||
|
if (!gl_HelperInvocation)
|
||
|
{
|
||
|
do
|
||
|
{
|
||
|
_123 = 100u;
|
||
|
} while (!atomic_compare_exchange_weak_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], &_123, 42u, memory_order_relaxed, memory_order_relaxed) && _123 == 100u);
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
_123 = atomic_load_explicit((device atomic_uint*)&bar_atomic[spvImage2DAtomicCoord(_100, bar)], memory_order_relaxed);
|
||
|
}
|
||
|
out.fragColor = float4(1.0, 0.0, 0.0, 1.0);
|
||
|
return out;
|
||
|
}
|
||
|
|