static const uint3 gl_WorkGroupSize = uint3(1u, 1u, 1u); RWByteAddressBuffer _28 : register(u0); cbuffer UBO : register(b1) { int _68_index0 : packoffset(c0); int _68_index1 : packoffset(c0.y); }; void row_to_col() { float4x4 _55 = asfloat(uint4x4(_28.Load(64), _28.Load(80), _28.Load(96), _28.Load(112), _28.Load(68), _28.Load(84), _28.Load(100), _28.Load(116), _28.Load(72), _28.Load(88), _28.Load(104), _28.Load(120), _28.Load(76), _28.Load(92), _28.Load(108), _28.Load(124))); _28.Store4(0, asuint(_55[0])); _28.Store4(16, asuint(_55[1])); _28.Store4(32, asuint(_55[2])); _28.Store4(48, asuint(_55[3])); float2x2 _58 = asfloat(uint2x2(_28.Load(144), _28.Load(152), _28.Load(148), _28.Load(156))); _28.Store2(128, asuint(_58[0])); _28.Store2(136, asuint(_58[1])); float2x3 _61 = asfloat(uint2x3(_28.Load(192), _28.Load(200), _28.Load(208), _28.Load(196), _28.Load(204), _28.Load(212))); _28.Store3(160, asuint(_61[0])); _28.Store3(176, asuint(_61[1])); float3x2 _64 = asfloat(uint3x2(_28.Load(240), _28.Load(256), _28.Load(244), _28.Load(260), _28.Load(248), _28.Load(264))); _28.Store2(216, asuint(_64[0])); _28.Store2(224, asuint(_64[1])); _28.Store2(232, asuint(_64[2])); } void col_to_row() { float4x4 _34 = asfloat(uint4x4(_28.Load4(0), _28.Load4(16), _28.Load4(32), _28.Load4(48))); _28.Store(64, asuint(_34[0].x)); _28.Store(68, asuint(_34[1].x)); _28.Store(72, asuint(_34[2].x)); _28.Store(76, asuint(_34[3].x)); _28.Store(80, asuint(_34[0].y)); _28.Store(84, asuint(_34[1].y)); _28.Store(88, asuint(_34[2].y)); _28.Store(92, asuint(_34[3].y)); _28.Store(96, asuint(_34[0].z)); _28.Store(100, asuint(_34[1].z)); _28.Store(104, asuint(_34[2].z)); _28.Store(108, asuint(_34[3].z)); _28.Store(112, asuint(_34[0].w)); _28.Store(116, asuint(_34[1].w)); _28.Store(120, asuint(_34[2].w)); _28.Store(124, asuint(_34[3].w)); float2x2 _40 = asfloat(uint2x2(_28.Load2(128), _28.Load2(136))); _28.Store(144, asuint(_40[0].x)); _28.Store(148, asuint(_40[1].x)); _28.Store(152, asuint(_40[0].y)); _28.Store(156, asuint(_40[1].y)); float2x3 _46 = asfloat(uint2x3(_28.Load3(160), _28.Load3(176))); _28.Store(192, asuint(_46[0].x)); _28.Store(196, asuint(_46[1].x)); _28.Store(200, asuint(_46[0].y)); _28.Store(204, asuint(_46[1].y)); _28.Store(208, asuint(_46[0].z)); _28.Store(212, asuint(_46[1].z)); float3x2 _52 = asfloat(uint3x2(_28.Load2(216), _28.Load2(224), _28.Load2(232))); _28.Store(240, asuint(_52[0].x)); _28.Store(244, asuint(_52[1].x)); _28.Store(248, asuint(_52[2].x)); _28.Store(256, asuint(_52[0].y)); _28.Store(260, asuint(_52[1].y)); _28.Store(264, asuint(_52[2].y)); } void write_dynamic_index_row() { _28.Store(_68_index0 * 4 + _68_index1 * 16 + 64, asuint(1.0f)); _28.Store(_68_index0 * 4 + _68_index1 * 8 + 144, asuint(2.0f)); _28.Store(_68_index0 * 4 + _68_index1 * 8 + 192, asuint(3.0f)); _28.Store(_68_index0 * 4 + _68_index1 * 16 + 240, asuint(4.0f)); _28.Store(_68_index0 * 4 + 64, asuint(1.0f.x)); _28.Store(_68_index0 * 4 + 80, asuint(1.0f.xxxx.y)); _28.Store(_68_index0 * 4 + 96, asuint(1.0f.xxxx.z)); _28.Store(_68_index0 * 4 + 112, asuint(1.0f.xxxx.w)); _28.Store(_68_index0 * 4 + 144, asuint(2.0f.x)); _28.Store(_68_index0 * 4 + 152, asuint(2.0f.xx.y)); _28.Store(_68_index0 * 4 + 192, asuint(3.0f.x)); _28.Store(_68_index0 * 4 + 200, asuint(3.0f.xxx.y)); _28.Store(_68_index0 * 4 + 208, asuint(3.0f.xxx.z)); _28.Store(_68_index0 * 4 + 240, asuint(4.0f.x)); _28.Store(_68_index0 * 4 + 256, asuint(4.0f.xx.y)); } void write_dynamic_index_col() { _28.Store(_68_index0 * 16 + _68_index1 * 4 + 0, asuint(1.0f)); _28.Store(_68_index0 * 8 + _68_index1 * 4 + 128, asuint(2.0f)); _28.Store(_68_index0 * 16 + _68_index1 * 4 + 160, asuint(3.0f)); _28.Store(_68_index0 * 8 + _68_index1 * 4 + 216, asuint(4.0f)); _28.Store4(_68_index0 * 16 + 0, asuint(1.0f.xxxx)); _28.Store2(_68_index0 * 8 + 128, asuint(2.0f.xx)); _28.Store3(_68_index0 * 16 + 160, asuint(3.0f.xxx)); _28.Store2(_68_index0 * 8 + 216, asuint(4.0f.xx)); } void read_dynamic_index_row() { float a0 = asfloat(_28.Load(_68_index0 * 4 + _68_index1 * 16 + 64)); float a1 = asfloat(_28.Load(_68_index0 * 4 + _68_index1 * 8 + 144)); float a2 = asfloat(_28.Load(_68_index0 * 4 + _68_index1 * 8 + 192)); float a3 = asfloat(_28.Load(_68_index0 * 4 + _68_index1 * 16 + 240)); float4 v0 = asfloat(uint4(_28.Load(_68_index0 * 4 + 64), _28.Load(_68_index0 * 4 + 80), _28.Load(_68_index0 * 4 + 96), _28.Load(_68_index0 * 4 + 112))); float2 v1 = asfloat(uint2(_28.Load(_68_index0 * 4 + 144), _28.Load(_68_index0 * 4 + 152))); float3 v2 = asfloat(uint3(_28.Load(_68_index0 * 4 + 192), _28.Load(_68_index0 * 4 + 200), _28.Load(_68_index0 * 4 + 208))); float2 v3 = asfloat(uint2(_28.Load(_68_index0 * 4 + 240), _28.Load(_68_index0 * 4 + 256))); } void read_dynamic_index_col() { float a0 = asfloat(_28.Load(_68_index0 * 16 + _68_index1 * 4 + 0)); float a1 = asfloat(_28.Load(_68_index0 * 8 + _68_index1 * 4 + 128)); float a2 = asfloat(_28.Load(_68_index0 * 16 + _68_index1 * 4 + 160)); float a3 = asfloat(_28.Load(_68_index0 * 8 + _68_index1 * 4 + 216)); float4 v0 = asfloat(_28.Load4(_68_index0 * 16 + 0)); float2 v1 = asfloat(_28.Load2(_68_index0 * 8 + 128)); float3 v2 = asfloat(_28.Load3(_68_index0 * 16 + 160)); float2 v3 = asfloat(_28.Load2(_68_index0 * 8 + 216)); } void comp_main() { row_to_col(); col_to_row(); write_dynamic_index_row(); write_dynamic_index_col(); read_dynamic_index_row(); read_dynamic_index_col(); } [numthreads(1, 1, 1)] void main() { comp_main(); }