85 lines
2.7 KiB
Plaintext
85 lines
2.7 KiB
Plaintext
#pragma clang diagnostic ignored "-Wmissing-prototypes"
|
|
|
|
#include <metal_stdlib>
|
|
#include <simd/simd.h>
|
|
|
|
using namespace metal;
|
|
|
|
struct SSBOCol
|
|
{
|
|
float2x3 col_major0;
|
|
float2x3 col_major1;
|
|
};
|
|
|
|
struct SSBORow
|
|
{
|
|
float3x4 row_major0;
|
|
float3x4 row_major1;
|
|
};
|
|
|
|
void load_store_to_variable_col_major(device SSBOCol& v_29)
|
|
{
|
|
float2x3 loaded = v_29.col_major0;
|
|
v_29.col_major1 = loaded;
|
|
}
|
|
|
|
void load_store_to_variable_row_major(device SSBORow& v_41)
|
|
{
|
|
float2x3 loaded = transpose(float2x3(v_41.row_major0[0].xy, v_41.row_major0[1].xy, v_41.row_major0[2].xy));
|
|
v_41.row_major0[0].xy = float2(loaded[0][0], loaded[1][0]));
|
|
v_41.row_major0[1].xy = float2(loaded[0][1], loaded[1][1]));
|
|
v_41.row_major0[2].xy = float2(loaded[0][2], loaded[1][2]));
|
|
}
|
|
|
|
void copy_col_major_to_col_major(device SSBOCol& v_29)
|
|
{
|
|
v_29.col_major0 = v_29.col_major1;
|
|
}
|
|
|
|
void copy_col_major_to_row_major(device SSBOCol& v_29, device SSBORow& v_41)
|
|
{
|
|
v_41.row_major0[0].xy = float2(v_29.col_major0[0][0], v_29.col_major0[1][0]));
|
|
v_41.row_major0[1].xy = float2(v_29.col_major0[0][1], v_29.col_major0[1][1]));
|
|
v_41.row_major0[2].xy = float2(v_29.col_major0[0][2], v_29.col_major0[1][2]));
|
|
}
|
|
|
|
void copy_row_major_to_col_major(device SSBOCol& v_29, device SSBORow& v_41)
|
|
{
|
|
v_29.col_major0 = transpose(float2x3(v_41.row_major0[0].xy, v_41.row_major0[1].xy, v_41.row_major0[2].xy));
|
|
}
|
|
|
|
void copy_row_major_to_row_major(device SSBORow& v_41)
|
|
{
|
|
v_41.row_major0[0].xy = float2x3(v_41.row_major1[0], v_41.row_major1[1])[0];
|
|
v_41.row_major0[1].xy = float2x3(v_41.row_major1[0], v_41.row_major1[1])[1];
|
|
v_41.row_major0[2].xy = float2x3(v_41.row_major1[0], v_41.row_major1[1])[2];
|
|
}
|
|
|
|
void copy_columns(device SSBOCol& v_29, device SSBORow& v_41)
|
|
{
|
|
v_29.col_major0[1] = float3(v_41.row_major0[0][1], v_41.row_major0[1][1], v_41.row_major0[2][1]);
|
|
v_41.row_major0[1][0].x = float(v_29.col_major0[1][0][0]));
|
|
v_41.row_major0[1][1].x = float(v_29.col_major0[1][0][1]));
|
|
v_41.row_major0[1][2].x = float(v_29.col_major0[1][0][2]));
|
|
device float3*(v_41.row_major0[0][1], v_41.row_major0[1][1], v_41.row_major0[2][1]) = v_29.col_major0[1];
|
|
}
|
|
|
|
void copy_elements(device SSBOCol& v_29, device SSBORow& v_41)
|
|
{
|
|
v_29.col_major0[0].y = v_41.row_major0[1u][0];
|
|
v_41.row_major0[1u][0] = v_29.col_major0[0].y;
|
|
}
|
|
|
|
kernel void main0(device SSBOCol& v_29 [[buffer(0)]], device SSBORow& v_41 [[buffer(1)]])
|
|
{
|
|
load_store_to_variable_col_major(v_29);
|
|
load_store_to_variable_row_major(v_41);
|
|
copy_col_major_to_col_major(v_29);
|
|
copy_col_major_to_row_major(v_29, v_41);
|
|
copy_row_major_to_col_major(v_29, v_41);
|
|
copy_row_major_to_row_major(v_41);
|
|
copy_columns(v_29, v_41);
|
|
copy_elements(v_29, v_41);
|
|
}
|
|
|