mirror of
https://github.com/KhronosGroup/glslang
synced 2024-11-08 11:30:06 +00:00
77 lines
1.9 KiB
Plaintext
77 lines
1.9 KiB
Plaintext
#version 450 core
|
|
#extension GL_KHR_memory_scope_semantics : enable
|
|
#extension GL_NV_cooperative_matrix : enable
|
|
#extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable
|
|
|
|
layout (local_size_x = 64, local_size_y = 1, local_size_z = 1) in; // compute workgroup size: 64 x 1 x 1
|
|
|
|
float<16> ftemplate16; // type parameter list applied to plain 'float'; NOTE(review): presumably expected to be rejected - confirm
|
|
|
|
fcoopmatNV fnoparams; // fcoopmatNV with no type parameter list at all; presumably an error case, per the name - confirm
|
|
|
|
fcoopmatNV<8, gl_ScopeSubgroup, 8, 8> fbadbits; // first parameter is 8, whereas main() only uses 16 or 32; presumably an unsupported bit width, per the name - confirm
|
|
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 8> fbadnumparams; // only three type parameters; every other parameterized fcoopmatNV in this file passes four
|
|
|
|
int X = 8; // plain global (neither const nor a specialization constant); used as a type parameter on the next declaration
|
|
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 8, X> fbadparam; // last parameter is the non-constant X; NOTE(review): presumably must be a constant expression - confirm
|
|
|
|
layout(constant_id = 0) int Y = 1; // specialization constant with constant_id 0, initialized to 1; used as a matrix type parameter in main()
|
|
|
|
shared fcoopmatNV<16, gl_ScopeSubgroup, 16, 16> sharedmat; // cooperative matrix declared with 'shared' storage; NOTE(review): presumably disallowed - confirm
|
|
|
|
layout(set = 0, binding = 0) buffer InvBlock { // buffer block at set 0, binding 0
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 16, 16> bufmat; // cooperative matrix as a buffer-block member; presumably disallowed (block is named InvBlock) - confirm
|
|
} invblock;
|
|
|
|
void main() // Exercises fcoopmatNV uses that the comments below label invalid or unsupported; NOTE(review): presumably every flagged statement is expected to produce a compile error - confirm against the expected output
|
|
{
|
|
fcoopmatNV<32, gl_ScopeSubgroup, 16, 8> f32_16_8; // same last two parameters as f16_16_8; differs only in the first parameter (32 vs 16)
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 16, 8> f16_16_8;
|
|
|
|
// invalid implicit conversions
|
|
f32_16_8 = f16_16_8; // assigns a <16, ...> matrix to a <32, ...> matrix
|
|
f32_16_8 = f16_16_8 + f16_16_8; // same mismatch, with the source being the result of an addition
|
|
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 8, 8> f16_8_8; // third parameter is 8, versus 16 in f16_16_8
|
|
|
|
// mismatching dimensions
|
|
f16_16_8 = f16_8_8; // third type parameter differs (16 vs 8)
|
|
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 8, Y> f16_8_Y; // last parameter is the specialization constant Y
|
|
fcoopmatNV<16, gl_ScopeSubgroup, 8, (Y+1)> f16_8_Y1; // last parameter is the expression Y+1
|
|
|
|
// mismatching dimensions with specialization constants
|
|
f16_8_Y = f16_8_Y1; // last type parameter is Y on the left and Y+1 on the right
|
|
|
|
// wrong arguments for constructor
|
|
f16_8_8 = fcoopmatNV<16, gl_ScopeSubgroup, 8, 8>(1, 1); // constructor invoked with two arguments
|
|
|
|
// can't construct from a builtin type
|
|
mat4 m4;
|
|
fcoopmatNV<32, gl_ScopeSubgroup, 4, 4> f32_4_4 = fcoopmatNV<32, gl_ScopeSubgroup, 4, 4>(m4); // constructor argument is the built-in mat4 declared above
|
|
|
|
// only support a single array subscript
|
|
f16_16_8[0][0]; // two chained subscripts
|
|
|
|
// don't support scalar component selection
|
|
f16_16_8.x; // vector-style .x selector applied to the matrix
|
|
|
|
f16_16_8 * f16_16_8; // '*' between two matrices of the same type; NOTE(review): presumably unsupported - confirm
|
|
|
|
f16_16_8 + 1.0; // the next six statements combine the matrix with the scalar literal 1.0 via +, -, / and their compound-assignment forms; NOTE(review): presumably unsupported - confirm
|
|
f16_16_8 - 1.0;
|
|
f16_16_8 / 1.0;
|
|
f16_16_8 += 1.0;
|
|
f16_16_8 -= 1.0;
|
|
f16_16_8 /= 1.0;
|
|
|
|
f16_16_8*2.0; // <16, ...> matrix times the literal 2.0 (not wrapped in float16_t); NOTE(review): presumably a scalar/component type mismatch - confirm
|
|
2.0*f16_16_8; // same operands, scalar on the left
|
|
f32_16_8*float16_t(2.0); // <32, ...> matrix times a float16_t scalar; NOTE(review): presumably a scalar/component type mismatch - confirm
|
|
float16_t(2.0)*f32_16_8; // same operands, scalar on the left
|
|
|
|
transpose(f16_8_8); // built-in transpose() called on a cooperative matrix; NOTE(review): presumably no matching overload - confirm
|
|
}
|