mirror of
https://github.com/encounter/dawn-cmake.git
synced 2025-06-05 06:03:34 +00:00
Bug: none Change-Id: I9d48951019f5e1cfeca3815245a8818d79c3d1da Reviewed-on: https://dawn-review.googlesource.com/c/dawn/+/68282 Reviewed-by: Corentin Wallez <cwallez@chromium.org> Reviewed-by: Loko Kung <lokokung@google.com> Commit-Queue: Austin Eng <enga@chromium.org>
188 lines
7.7 KiB
C++
188 lines
7.7 KiB
C++
// Copyright 2020 The Dawn Authors
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
#include "dawn_native/QueryHelper.h"
|
|
|
|
#include "dawn_native/BindGroup.h"
|
|
#include "dawn_native/BindGroupLayout.h"
|
|
#include "dawn_native/Buffer.h"
|
|
#include "dawn_native/CommandEncoder.h"
|
|
#include "dawn_native/ComputePassEncoder.h"
|
|
#include "dawn_native/ComputePipeline.h"
|
|
#include "dawn_native/Device.h"
|
|
#include "dawn_native/InternalPipelineStore.h"
|
|
#include "dawn_native/utils/WGPUHelpers.h"
|
|
|
|
namespace dawn_native {
|
|
|
|
namespace {
|
|
|
|
// Assert the offsets in dawn_native::TimestampParams are same with the ones in the shader
|
|
static_assert(offsetof(dawn_native::TimestampParams, first) == 0, "");
|
|
static_assert(offsetof(dawn_native::TimestampParams, count) == 4, "");
|
|
static_assert(offsetof(dawn_native::TimestampParams, offset) == 8, "");
|
|
static_assert(offsetof(dawn_native::TimestampParams, period) == 12, "");
|
|
|
|
static const char sConvertTimestampsToNanoseconds[] = R"(
|
|
struct Timestamp {
|
|
low : u32;
|
|
high : u32;
|
|
};
|
|
|
|
[[block]] struct TimestampArr {
|
|
t : array<Timestamp>;
|
|
};
|
|
|
|
[[block]] struct AvailabilityArr {
|
|
v : array<u32>;
|
|
};
|
|
|
|
[[block]] struct TimestampParams {
|
|
first : u32;
|
|
count : u32;
|
|
offset : u32;
|
|
period : f32;
|
|
};
|
|
|
|
[[group(0), binding(0)]]
|
|
var<storage, read_write> timestamps : TimestampArr;
|
|
[[group(0), binding(1)]]
|
|
var<storage, read> availability : AvailabilityArr;
|
|
[[group(0), binding(2)]] var<uniform> params : TimestampParams;
|
|
|
|
|
|
let sizeofTimestamp : u32 = 8u;
|
|
|
|
[[stage(compute), workgroup_size(8, 1, 1)]]
|
|
fn main([[builtin(global_invocation_id)]] GlobalInvocationID : vec3<u32>) {
|
|
if (GlobalInvocationID.x >= params.count) { return; }
|
|
|
|
var index = GlobalInvocationID.x + params.offset / sizeofTimestamp;
|
|
|
|
var timestamp = timestamps.t[index];
|
|
|
|
// Return 0 for the unavailable value.
|
|
if (availability.v[GlobalInvocationID.x + params.first] == 0u) {
|
|
timestamps.t[index].low = 0u;
|
|
timestamps.t[index].high = 0u;
|
|
return;
|
|
}
|
|
|
|
// Multiply the values in timestamps buffer by the period.
|
|
var period = params.period;
|
|
var w = 0u;
|
|
|
|
// If the product of low 32-bits and the period does not exceed the maximum of u32,
|
|
// directly do the multiplication, otherwise, use two u32 to represent the high
|
|
// 16-bits and low 16-bits of this u32, then multiply them by the period separately.
|
|
if (timestamp.low <= u32(f32(0xFFFFFFFFu) / period)) {
|
|
timestamps.t[index].low = u32(round(f32(timestamp.low) * period));
|
|
} else {
|
|
var lo = timestamp.low & 0xFFFFu;
|
|
var hi = timestamp.low >> 16u;
|
|
|
|
var t0 = u32(round(f32(lo) * period));
|
|
var t1 = u32(round(f32(hi) * period)) + (t0 >> 16u);
|
|
w = t1 >> 16u;
|
|
|
|
var result = t1 << 16u;
|
|
result = result | (t0 & 0xFFFFu);
|
|
timestamps.t[index].low = result;
|
|
}
|
|
|
|
// Get the nearest integer to the float result. For high 32-bits, the round
|
|
// function will greatly help reduce the accuracy loss of the final result.
|
|
timestamps.t[index].high = u32(round(f32(timestamp.high) * period)) + w;
|
|
}
|
|
)";
|
|
|
|
ResultOrError<ComputePipelineBase*> GetOrCreateTimestampComputePipeline(
|
|
DeviceBase* device) {
|
|
InternalPipelineStore* store = device->GetInternalPipelineStore();
|
|
|
|
if (store->timestampComputePipeline == nullptr) {
|
|
// Create compute shader module if not cached before.
|
|
if (store->timestampCS == nullptr) {
|
|
DAWN_TRY_ASSIGN(
|
|
store->timestampCS,
|
|
utils::CreateShaderModule(device, sConvertTimestampsToNanoseconds));
|
|
}
|
|
|
|
// Create binding group layout
|
|
Ref<BindGroupLayoutBase> bgl;
|
|
DAWN_TRY_ASSIGN(
|
|
bgl, utils::MakeBindGroupLayout(
|
|
device,
|
|
{
|
|
{0, wgpu::ShaderStage::Compute, kInternalStorageBufferBinding},
|
|
{1, wgpu::ShaderStage::Compute,
|
|
wgpu::BufferBindingType::ReadOnlyStorage},
|
|
{2, wgpu::ShaderStage::Compute, wgpu::BufferBindingType::Uniform},
|
|
},
|
|
/* allowInternalBinding */ true));
|
|
|
|
// Create pipeline layout
|
|
Ref<PipelineLayoutBase> layout;
|
|
DAWN_TRY_ASSIGN(layout, utils::MakeBasicPipelineLayout(device, bgl));
|
|
|
|
// Create ComputePipeline.
|
|
ComputePipelineDescriptor computePipelineDesc = {};
|
|
// Generate the layout based on shader module.
|
|
computePipelineDesc.layout = layout.Get();
|
|
computePipelineDesc.compute.module = store->timestampCS.Get();
|
|
computePipelineDesc.compute.entryPoint = "main";
|
|
|
|
DAWN_TRY_ASSIGN(store->timestampComputePipeline,
|
|
device->CreateComputePipeline(&computePipelineDesc));
|
|
}
|
|
|
|
return store->timestampComputePipeline.Get();
|
|
}
|
|
|
|
} // anonymous namespace
|
|
|
|
MaybeError EncodeConvertTimestampsToNanoseconds(CommandEncoder* encoder,
|
|
BufferBase* timestamps,
|
|
BufferBase* availability,
|
|
BufferBase* params) {
|
|
DeviceBase* device = encoder->GetDevice();
|
|
|
|
ComputePipelineBase* pipeline;
|
|
DAWN_TRY_ASSIGN(pipeline, GetOrCreateTimestampComputePipeline(device));
|
|
|
|
// Prepare bind group layout.
|
|
Ref<BindGroupLayoutBase> layout;
|
|
DAWN_TRY_ASSIGN(layout, pipeline->GetBindGroupLayout(0));
|
|
|
|
// Create bind group after all binding entries are set.
|
|
Ref<BindGroupBase> bindGroup;
|
|
DAWN_TRY_ASSIGN(bindGroup,
|
|
utils::MakeBindGroup(device, layout,
|
|
{{0, timestamps}, {1, availability}, {2, params}}));
|
|
|
|
// Create compute encoder and issue dispatch.
|
|
ComputePassDescriptor passDesc = {};
|
|
// TODO(dawn:723): change to not use AcquireRef for reentrant object creation.
|
|
Ref<ComputePassEncoder> pass = AcquireRef(encoder->APIBeginComputePass(&passDesc));
|
|
pass->APISetPipeline(pipeline);
|
|
pass->APISetBindGroup(0, bindGroup.Get());
|
|
pass->APIDispatch(
|
|
static_cast<uint32_t>((timestamps->GetSize() / sizeof(uint64_t) + 7) / 8));
|
|
pass->APIEndPass();
|
|
|
|
return {};
|
|
}
|
|
|
|
} // namespace dawn_native
|