mirror of
https://github.com/encounter/dawn-cmake.git
synced 2025-06-30 10:23:35 +00:00
Change the DecomposeMemoryAccess to behave more like the DirectVariableAccess transform, in that it'll inline the access of buffer variable into the load / store helper functions, instead of passing the array down. This avoids large array copies observed with FXC, which can have *severe* performance costs. Fixed: tint:1819 Change-Id: I52eb3f908813f72ab9da446743e24a2637158309 Reviewed-on: https://dawn-review.googlesource.com/c/dawn/+/121460 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Reviewed-by: James Price <jrprice@google.com> Commit-Queue: James Price <jrprice@google.com>
17 lines
581 B
HLSL
17 lines
581 B
HLSL
cbuffer cbuffer_data : register(b0, space0) {
|
|
uint4 data[5];
|
|
};
|
|
|
|
float4x3 data_load_1(uint offset) {
|
|
const uint scalar_offset = ((offset + 0u)) / 4;
|
|
const uint scalar_offset_1 = ((offset + 16u)) / 4;
|
|
const uint scalar_offset_2 = ((offset + 32u)) / 4;
|
|
const uint scalar_offset_3 = ((offset + 48u)) / 4;
|
|
return float4x3(asfloat(data[scalar_offset / 4].xyz), asfloat(data[scalar_offset_1 / 4].xyz), asfloat(data[scalar_offset_2 / 4].xyz), asfloat(data[scalar_offset_3 / 4].xyz));
|
|
}
|
|
|
|
void main() {
|
|
const float4 x = mul(data_load_1(0u), asfloat(data[4].xyz));
|
|
return;
|
|
}
|