ec054dad7f
Emit synthetic functions before function constants. Support use of spvQuantizeToF16() in function constants for numerical behavior consistency with the op code. Ensure subnormal results from OpQuantizeToF16 are flushed to zero per SPIR-V spec. Adjust SPIRV-Cross unit test reference shaders to accommodate these changes. Any MSL reference shader that inclues a synthetic function is affected, since the location it is emitted has changed.
33 lines
1013 B
Plaintext
33 lines
1013 B
Plaintext
#pragma clang diagnostic ignored "-Wmissing-prototypes"
|
|
|
|
#include <metal_stdlib>
|
|
#include <simd/simd.h>
|
|
|
|
using namespace metal;
|
|
|
|
// Returns 2D texture coords corresponding to 1D texel buffer coords
|
|
static inline __attribute__((always_inline))
|
|
uint2 spvTexelBufferCoord(uint tc)
|
|
{
|
|
return uint2(tc % 4096, tc / 4096);
|
|
}
|
|
|
|
struct cb5_struct
|
|
{
|
|
float4 _m0[5];
|
|
};
|
|
|
|
kernel void main0(constant cb5_struct& cb0_5 [[buffer(0)]], texture2d<uint, access::write> u0 [[texture(0)]], uint3 gl_LocalInvocationID [[thread_position_in_threadgroup]])
|
|
{
|
|
float4 r0;
|
|
r0.x = as_type<float>(int(gl_LocalInvocationID.x) << 4);
|
|
r0.y = as_type<float>(int(gl_LocalInvocationID.x));
|
|
uint _44 = as_type<uint>(r0.x) >> 2u;
|
|
uint4 _51 = as_type<uint4>(cb0_5._m0[uint(as_type<int>(r0.y)) + 1u]);
|
|
u0.write(_51.xxxx, spvTexelBufferCoord(_44));
|
|
u0.write(_51.yyyy, spvTexelBufferCoord((_44 + 1u)));
|
|
u0.write(_51.zzzz, spvTexelBufferCoord((_44 + 2u)));
|
|
u0.write(_51.wwww, spvTexelBufferCoord((_44 + 3u)));
|
|
}
|
|
|