42 lines
1.1 KiB
HLSL
42 lines
1.1 KiB
HLSL
struct Uniforms {
|
|
uint2 aShape;
|
|
uint2 bShape;
|
|
uint2 outShape;
|
|
};
|
|
struct tint_symbol_1 {
|
|
uint3 global_id : SV_DispatchThreadID;
|
|
};
|
|
|
|
ConstantBuffer<Uniforms> uniforms : register(b3, space0);
|
|
|
|
ByteAddressBuffer firstMatrix : register(t0, space0);
|
|
ByteAddressBuffer secondMatrix : register(t1, space0);
|
|
RWByteAddressBuffer resultMatrix : register(u2, space0);
|
|
|
|
[numthreads(2, 2, 1)]
|
|
void main(tint_symbol_1 tint_symbol) {
|
|
const uint3 global_id = tint_symbol.global_id;
|
|
const uint2 resultCell = uint2(global_id.y, global_id.x);
|
|
const uint dimInner = uniforms.aShape.y;
|
|
const uint dimOutter = uniforms.outShape.y;
|
|
uint result = 0u;
|
|
{
|
|
uint i = 0u;
|
|
while (true) {
|
|
if (!((i < dimInner))) {
|
|
break;
|
|
}
|
|
const uint a = (i + (resultCell.x * dimInner));
|
|
const uint b = (resultCell.y + (i * dimOutter));
|
|
result = (result + (firstMatrix.Load((4u * a)) * secondMatrix.Load((4u * b))));
|
|
{
|
|
i = (i + 1u);
|
|
}
|
|
}
|
|
}
|
|
const uint index = (resultCell.y + (resultCell.x * dimOutter));
|
|
resultMatrix.Store((4u * index), asuint(result));
|
|
return;
|
|
}
|
|
|