mirror of
https://github.com/encounter/dawn-cmake.git
synced 2025-10-24 02:35:52 +00:00
In order to preserve padding properly for MSL, we need to use its packed_vec type for all vec3 types in storage buffers, not just struct members. This commit includes a complete rewrite of the PackedVec3 transform to achieve this.

The key details are:
* An internal `__packed_vec3<>` type was added, which corresponds to a `type::Vector` with an additional flag to indicate that it will be emitted as a packed vector.
* The `PackedVec3` transform replaces all vec3 types used in host-shareable address spaces with the internal `__packed_vec3` type. This includes vec3 types that appear as the store type of a pointer.
* When used as an array element, these `__packed_vec3` types are wrapped in a struct that contains a single `__packed_vec3` member. This allows us to add an `@align()` attribute that ensures that `array<vec3<T>>` still has the correct array element stride.
* When the `vec3<T>` appears as a struct member in the input program, we apply the `@align()` to that member to ensure that we do not change its offset.
* Matrix types with three rows that are used in memory are replaced with an array of columns, where each column uses a `__packed_vec3` inside an aligned wrapper structure as above.
* Accesses to host-shareable memory that involve any of these types invoke a "pack" or "unpack" helper function to convert them to the equivalent type that uses `__packed_vec3` or a regular `vec3` as required.
* The `chromium_internal_relaxed_uniform_layout` extension is used to avoid issues where modifying a type in the uniform address space triggers stricter layout validation rules.

Bug: tint:1571
Fixed: tint:1837
Change-Id: Idaf2da2f5bcb2be00c85ec657edfb614186476bb
Reviewed-on: https://dawn-review.googlesource.com/c/dawn/+/121200
Reviewed-by: Ben Clayton <bclayton@google.com>
Commit-Queue: James Price <jrprice@google.com>
Kokoro: Kokoro <noreply+kokoro@google.com>
132 lines
5.5 KiB
Plaintext
132 lines
5.5 KiB
Plaintext
#include <metal_stdlib>
|
|
|
|
using namespace metal;
|
|
|
|
// Fixed-size array wrapper holding N elements of type T.
//
// operator[] is overloaded on the address space of the wrapper object
// (constant, device, thread, threadgroup) so that indexing returns a
// reference qualified with that same address space. Only a const overload is
// provided for `constant`; the other three address spaces get both a mutable
// and a const overload. The index is forwarded to `elements` unchecked.
template <typename T, size_t N>
struct tint_array {
  // Backing storage.
  T elements[N];

  // constant address space (const access only).
  const constant T& operator[](size_t index) const constant { return elements[index]; }

  // device address space.
  device T& operator[](size_t index) device { return elements[index]; }
  const device T& operator[](size_t index) const device { return elements[index]; }

  // thread address space.
  thread T& operator[](size_t index) thread { return elements[index]; }
  const thread T& operator[](size_t index) const thread { return elements[index]; }

  // threadgroup address space.
  threadgroup T& operator[](size_t index) threadgroup { return elements[index]; }
  const threadgroup T& operator[](size_t index) const threadgroup { return elements[index]; }
};
|
|
|
|
// Array-element wrapper around a single packed_float3.
//
// The packed vector sits at byte offset 0x0 and is followed by four bytes of
// explicit padding at offset 0xc, as annotated per member below.
struct tint_packed_vec3_f32_array_element {
  packed_float3 elements;          // offset 0x0000
  tint_array<int8_t, 4> tint_pad;  // offset 0x000c: explicit padding bytes
};
|
|
|
|
// Scalar coefficients read by gammaCorrection().
//
// gammaCorrection() uses D as the threshold on |v|, C and F for the branch
// taken below the threshold, and A, B, G, E for the branch taken otherwise.
// `padding` is not read by any function in this file.
struct GammaTransferParams {
  float G;       // offset 0x0000
  float A;       // offset 0x0004
  float B;       // offset 0x0008
  float C;       // offset 0x000c
  float D;       // offset 0x0010
  float E;       // offset 0x0014
  float F;       // offset 0x0018
  uint padding;  // offset 0x001c
};
|
|
|
|
// Buffer-side form of ExternalTextureParams, as bound through the `constant`
// pointer parameters of the entry points.
//
// It differs from ExternalTextureParams in two ways: explicit padding members
// (tint_pad_1, tint_pad_2) are present, and gamutConversionMatrix is stored as
// an array of three tint_packed_vec3_f32_array_element columns rather than a
// float3x3. tint_unpack_vec3_in_composite_1() converts it to the plain form.
// Byte offsets are annotated per member.
struct ExternalTextureParams_tint_packed_vec3 {
  uint numPlanes;                                                               // offset 0x0000
  uint doYuvToRgbConversionOnly;                                                // offset 0x0004
  tint_array<int8_t, 8> tint_pad_1;                                             // offset 0x0008: explicit padding
  float3x4 yuvToRgbConversionMatrix;                                            // offset 0x0010
  GammaTransferParams gammaDecodeParams;                                        // offset 0x0040
  GammaTransferParams gammaEncodeParams;                                        // offset 0x0060
  tint_array<tint_packed_vec3_f32_array_element, 3> gamutConversionMatrix;      // offset 0x0080
  float3x2 coordTransformationMatrix;                                           // offset 0x00b0
  tint_array<int8_t, 8> tint_pad_2;                                             // offset 0x00c8: explicit padding
};
|
|
|
|
// Converts an array of three packed-vec3 wrapper elements into a float3x3.
//
// Column k of the returned matrix is float3(in[k].elements) for k = 0, 1, 2.
float3x3 tint_unpack_vec3_in_composite(tint_array<tint_packed_vec3_f32_array_element, 3> in) {
  float3 const column0 = float3(in[0u].elements);
  float3 const column1 = float3(in[1u].elements);
  float3 const column2 = float3(in[2u].elements);
  return float3x3(column0, column1, column2);
}
|
|
|
|
// Plain (unpacked) form of the external-texture parameter block, as consumed
// by textureLoadExternal().
//
// Produced from ExternalTextureParams_tint_packed_vec3 by
// tint_unpack_vec3_in_composite_1(); here gamutConversionMatrix is a regular
// float3x3 and there are no explicit padding members.
struct ExternalTextureParams {
  // Compared against 1u in textureLoadExternal() to choose the load path.
  uint numPlanes;
  // When 0u, textureLoadExternal() also applies gamma decode, the gamut
  // matrix and gamma encode.
  uint doYuvToRgbConversionOnly;
  // Right-hand operand of the float4 * matrix product on the multi-plane path.
  float3x4 yuvToRgbConversionMatrix;
  // Passed to gammaCorrection() before the gamut matrix is applied.
  GammaTransferParams gammaDecodeParams;
  // Passed to gammaCorrection() after the gamut matrix is applied.
  GammaTransferParams gammaEncodeParams;
  // Left-multiplied onto the colour between the two gamma steps.
  float3x3 gamutConversionMatrix;
  // Copied through by the unpack helper; not read by the load path in this file.
  float3x2 coordTransformationMatrix;
};
|
|
|
|
// Converts the buffer-side parameter block into the plain ExternalTextureParams.
//
// Every member is copied through unchanged except gamutConversionMatrix, which
// is rebuilt as a float3x3 by tint_unpack_vec3_in_composite(). The padding
// members of the input have no counterpart in the result.
ExternalTextureParams tint_unpack_vec3_in_composite_1(ExternalTextureParams_tint_packed_vec3 in) {
  // Initializers are listed in the member declaration order of
  // ExternalTextureParams.
  ExternalTextureParams unpacked = {
      /* numPlanes                 */ in.numPlanes,
      /* doYuvToRgbConversionOnly  */ in.doYuvToRgbConversionOnly,
      /* yuvToRgbConversionMatrix  */ in.yuvToRgbConversionMatrix,
      /* gammaDecodeParams         */ in.gammaDecodeParams,
      /* gammaEncodeParams         */ in.gammaEncodeParams,
      /* gamutConversionMatrix     */ tint_unpack_vec3_in_composite(in.gamutConversionMatrix),
      /* coordTransformationMatrix */ in.coordTransformationMatrix,
  };
  return unpacked;
}
|
|
|
|
// Applies a piecewise transfer function to each component of `v`.
//
// With a = |v| and s = sign(v), per component:
//   a <  params.D : s * (params.C * a + params.F)
//   otherwise     : s * (pow(params.A * a + params.B, params.G) + params.E)
// Both candidates are computed for all components and select() then picks
// between them per component.
float3 gammaCorrection(float3 v, GammaTransferParams params) {
  float3 const magnitude = fabs(v);
  float3 const signOfV = sign(v);

  bool3 const belowThreshold = (magnitude < float3(params.D));

  float3 const linearTerm = (signOfV * ((params.C * magnitude) + params.F));

  float3 const powerBase = ((params.A * magnitude) + params.B);
  float3 const powerTerm = (signOfV * (pow(powerBase, float3(params.G)) + params.E));

  // select(a, b, c) yields b where c is true and a elsewhere.
  return select(powerTerm, linearTerm, belowThreshold);
}
|
|
|
|
// Loads one texel from a one- or multi-plane external texture and returns it
// as float4(rgb, 1.0f).
//
// - params.numPlanes == 1u: the rgb channels of plane0 at `coord` are used
//   directly.
// - otherwise: the first channel of plane0 at `coord` and the first two
//   channels of plane1 at `coord >> 1` are combined into
//   float4(p0, p1.rg, 1.0f) and multiplied by params.yuvToRgbConversionMatrix.
//
// Unless params.doYuvToRgbConversionOnly is non-zero, the colour then goes
// through gamma decode, the gamut conversion matrix and gamma encode.
// All reads use mip level 0.
float4 textureLoadExternal(texture2d<float, access::sample> plane0,
                           texture2d<float, access::sample> plane1,
                           int2 coord,
                           ExternalTextureParams params) {
  float3 rgb = float3(0.0f);

  if (params.numPlanes == 1u) {
    rgb = plane0.read(uint2(coord), 0).rgb;
  } else {
    // plane1 is addressed with each coordinate component shifted right by one.
    int2 const halfCoord = (coord >> uint2(1u));
    float const plane0Value = plane0.read(uint2(coord), 0).r;
    float2 const plane1Values = plane1.read(uint2(halfCoord), 0).rg;
    rgb = (float4(plane0Value, plane1Values, 1.0f) * params.yuvToRgbConversionMatrix);
  }

  if (params.doYuvToRgbConversionOnly != 0u) {
    return float4(rgb, 1.0f);
  }

  rgb = gammaCorrection(rgb, params.gammaDecodeParams);
  rgb = (params.gamutConversionMatrix * rgb);
  rgb = gammaCorrection(rgb, params.gammaEncodeParams);
  return float4(rgb, 1.0f);
}
|
|
|
|
// Thin forwarding wrapper around textureLoadExternal().
//
// The only difference from the callee is argument order: this function takes
// (plane0, plane1, params, coords) and passes (plane0, plane1, coords, params).
float4 textureLoad2d(texture2d<float, access::sample> tint_symbol,
                     texture2d<float, access::sample> ext_tex_plane_1_1,
                     ExternalTextureParams ext_tex_params_1,
                     int2 coords) {
  return textureLoadExternal(
      /* plane0 */ tint_symbol,
      /* plane1 */ ext_tex_plane_1_1,
      /* coord  */ coords,
      /* params */ ext_tex_params_1);
}
|
|
|
|
// Performs a single external-texture load at coordinate int2(0).
//
// The parameter block is read through the `constant` pointer, converted to the
// plain ExternalTextureParams form, and handed to textureLoad2d(). The loaded
// value is stored in a local and not used further.
void doTextureLoad(texture2d<float, access::sample> tint_symbol_2,
                   texture2d<float, access::sample> tint_symbol_3,
                   const constant ExternalTextureParams_tint_packed_vec3* const tint_symbol_4) {
  ExternalTextureParams const unpackedParams = tint_unpack_vec3_in_composite_1(*(tint_symbol_4));
  float4 res = textureLoad2d(tint_symbol_2, tint_symbol_3, unpackedParams, int2(0));
}
|
|
|
|
// Return type of the vertex entry point vertex_main().
struct tint_symbol_1 {
  // Carries the [[position]] attribute; filled from vertex_main_inner().
  float4 value [[position]];
};
|
|
|
|
// Body of the vertex entry point: runs doTextureLoad() with the supplied
// resources and then returns float4(0.0f) regardless of what was loaded.
float4 vertex_main_inner(texture2d<float, access::sample> tint_symbol_5,
                         texture2d<float, access::sample> tint_symbol_6,
                         const constant ExternalTextureParams_tint_packed_vec3* const tint_symbol_7) {
  doTextureLoad(tint_symbol_5, tint_symbol_6, tint_symbol_7);

  float4 const zero = float4(0.0f);
  return zero;
}
|
|
|
|
// Vertex entry point.
//
// Resources: textures at [[texture(0)]] and [[texture(1)]], parameter block at
// [[buffer(2)]]. The value returned by vertex_main_inner() is wrapped in
// tint_symbol_1 so that it is emitted with the [[position]] attribute.
vertex tint_symbol_1 vertex_main(texture2d<float, access::sample> tint_symbol_8 [[texture(0)]],
                                 texture2d<float, access::sample> tint_symbol_9 [[texture(1)]],
                                 const constant ExternalTextureParams_tint_packed_vec3* tint_symbol_10 [[buffer(2)]]) {
  tint_symbol_1 output = {};
  output.value = vertex_main_inner(tint_symbol_8, tint_symbol_9, tint_symbol_10);
  return output;
}
|
|
|
|
// Fragment entry point.
//
// Resources: textures at [[texture(0)]] and [[texture(1)]], parameter block at
// [[buffer(2)]]. Runs doTextureLoad() and produces no output value.
fragment void fragment_main(texture2d<float, access::sample> tint_symbol_11 [[texture(0)]],
                            texture2d<float, access::sample> tint_symbol_12 [[texture(1)]],
                            const constant ExternalTextureParams_tint_packed_vec3* tint_symbol_13 [[buffer(2)]]) {
  doTextureLoad(tint_symbol_11, tint_symbol_12, tint_symbol_13);
}
|
|
|
|
// Compute entry point.
//
// Resources: textures at [[texture(0)]] and [[texture(1)]], parameter block at
// [[buffer(2)]]. Runs doTextureLoad() and writes no results.
kernel void compute_main(texture2d<float, access::sample> tint_symbol_14 [[texture(0)]],
                         texture2d<float, access::sample> tint_symbol_15 [[texture(1)]],
                         const constant ExternalTextureParams_tint_packed_vec3* tint_symbol_16 [[buffer(2)]]) {
  doTextureLoad(tint_symbol_14, tint_symbol_15, tint_symbol_16);
}
|
|
|