// Copyright 2017 The NXT Authors // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "backend/CommandBuffer.h" #include "backend/BindGroup.h" #include "backend/Buffer.h" #include "backend/Commands.h" #include "backend/CommandBufferStateTracker.h" #include "backend/ComputePipeline.h" #include "backend/Device.h" #include "backend/InputState.h" #include "backend/PipelineLayout.h" #include "backend/RenderPipeline.h" #include "backend/Texture.h" #include #include namespace backend { namespace { bool ValidateCopyLocationFitsInTexture(CommandBufferBuilder* builder, const TextureCopyLocation& location) { const TextureBase* texture = location.texture.Get(); if (location.level >= texture->GetNumMipLevels()) { builder->HandleError("Copy mip-level out of range"); return false; } // All texture dimensions are in uint32_t so by doing checks in uint64_t we avoid overflows. uint64_t level = location.level; if (uint64_t(location.x) + uint64_t(location.width) > (static_cast(texture->GetWidth()) >> level) || uint64_t(location.y) + uint64_t(location.height) > (static_cast(texture->GetHeight()) >> level)) { builder->HandleError("Copy would touch outside of the texture"); return false; } // TODO(cwallez@chromium.org): Check the depth bound differently for 2D arrays and 3D textures if (location.z != 0 || location.depth != 1) { builder->HandleError("No support for z != 0 and depth != 1 for now"); return false; } return true; } bool FitsInBuffer(const BufferBase* buffer, uint32_t offset, uint32_t size) { uint32_t bufferSize = buffer->GetSize(); return offset <= bufferSize && (size <= (bufferSize - offset)); } bool ValidateCopySizeFitsInBuffer(CommandBufferBuilder* builder, const BufferCopyLocation& location, uint32_t dataSize) { if (!FitsInBuffer(location.buffer.Get(), location.offset, dataSize)) { builder->HandleError("Copy would overflow the buffer"); return false; } return true; } bool ValidateTexelBufferOffset(CommandBufferBuilder* builder, TextureBase* texture, const BufferCopyLocation& location) { uint32_t texelSize = static_cast(TextureFormatPixelSize(texture->GetFormat())); if (location.offset % texelSize != 0) { builder->HandleError("Buffer offset must be a multiple of the texel size"); return false; } return true; } bool ComputeTextureCopyBufferSize(CommandBufferBuilder*, const TextureCopyLocation& location, uint32_t rowPitch, uint32_t* bufferSize) { // TODO(cwallez@chromium.org): check for overflows *bufferSize = (rowPitch * (location.height - 1) + location.width) * location.depth; return true; } uint32_t ComputeDefaultRowPitch(TextureBase* texture, uint32_t width) { uint32_t texelSize = TextureFormatPixelSize(texture->GetFormat()); return texelSize * width; } bool ValidateRowPitch(CommandBufferBuilder* builder, const TextureCopyLocation& location, uint32_t rowPitch) { if (rowPitch % kTextureRowPitchAlignment != 0) { builder->HandleError("Row pitch must be a multiple of 256"); return false; } uint32_t texelSize = TextureFormatPixelSize(location.texture.Get()->GetFormat()); if (rowPitch < location.width * texelSize) { builder->HandleError("Row pitch must not be less than the number of bytes per row"); return false; } return true; } } CommandBufferBase::CommandBufferBase(CommandBufferBuilder* builder) : device(builder->device), buffersTransitioned(std::move(builder->state->buffersTransitioned)), texturesTransitioned(std::move(builder->state->texturesTransitioned)) { } bool CommandBufferBase::ValidateResourceUsagesImmediate() { for (auto buffer : buffersTransitioned) { if (buffer->IsFrozen()) { device->HandleError("Command buffer: cannot transition buffer with frozen usage"); return false; } } for (auto texture : texturesTransitioned) { if (texture->IsFrozen()) { device->HandleError("Command buffer: cannot transition texture with frozen usage"); return false; } } return true; } DeviceBase* CommandBufferBase::GetDevice() { return device; } void FreeCommands(CommandIterator* commands) { Command type; while(commands->NextCommandId(&type)) { switch (type) { case Command::BeginComputePass: { BeginComputePassCmd* begin = commands->NextCommand(); begin->~BeginComputePassCmd(); } break; case Command::BeginRenderPass: { BeginRenderPassCmd* begin = commands->NextCommand(); begin->~BeginRenderPassCmd(); } break; case Command::BeginRenderSubpass: { BeginRenderSubpassCmd* begin = commands->NextCommand(); begin->~BeginRenderSubpassCmd(); } break; case Command::CopyBufferToBuffer: { CopyBufferToBufferCmd* copy = commands->NextCommand(); copy->~CopyBufferToBufferCmd(); } break; case Command::CopyBufferToTexture: { CopyBufferToTextureCmd* copy = commands->NextCommand(); copy->~CopyBufferToTextureCmd(); } break; case Command::CopyTextureToBuffer: { CopyTextureToBufferCmd* copy = commands->NextCommand(); copy->~CopyTextureToBufferCmd(); } break; case Command::Dispatch: { DispatchCmd* dispatch = commands->NextCommand(); dispatch->~DispatchCmd(); } break; case Command::DrawArrays: { DrawArraysCmd* draw = commands->NextCommand(); draw->~DrawArraysCmd(); } break; case Command::DrawElements: { DrawElementsCmd* draw = commands->NextCommand(); draw->~DrawElementsCmd(); } break; case Command::EndComputePass: { EndComputePassCmd* cmd = commands->NextCommand(); cmd->~EndComputePassCmd(); } break; case Command::EndRenderPass: { EndRenderPassCmd* cmd = commands->NextCommand(); cmd->~EndRenderPassCmd(); } break; case Command::EndRenderSubpass: { EndRenderSubpassCmd* cmd = commands->NextCommand(); cmd->~EndRenderSubpassCmd(); } break; case Command::SetComputePipeline: { SetComputePipelineCmd* cmd = commands->NextCommand(); cmd->~SetComputePipelineCmd(); } break; case Command::SetRenderPipeline: { SetRenderPipelineCmd* cmd = commands->NextCommand(); cmd->~SetRenderPipelineCmd(); } break; case Command::SetPushConstants: { SetPushConstantsCmd* cmd = commands->NextCommand(); commands->NextData(cmd->count); cmd->~SetPushConstantsCmd(); } break; case Command::SetStencilReference: { SetStencilReferenceCmd* cmd = commands->NextCommand(); cmd->~SetStencilReferenceCmd(); } break; case Command::SetBindGroup: { SetBindGroupCmd* cmd = commands->NextCommand(); cmd->~SetBindGroupCmd(); } break; case Command::SetIndexBuffer: { SetIndexBufferCmd* cmd = commands->NextCommand(); cmd->~SetIndexBufferCmd(); } break; case Command::SetVertexBuffers: { SetVertexBuffersCmd* cmd = commands->NextCommand(); auto buffers = commands->NextData>(cmd->count); for (size_t i = 0; i < cmd->count; ++i) { (&buffers[i])->~Ref(); } commands->NextData(cmd->count); cmd->~SetVertexBuffersCmd(); } break; case Command::TransitionBufferUsage: { TransitionBufferUsageCmd* cmd = commands->NextCommand(); cmd->~TransitionBufferUsageCmd(); } break; case Command::TransitionTextureUsage: { TransitionTextureUsageCmd* cmd = commands->NextCommand(); cmd->~TransitionTextureUsageCmd(); } break; } } commands->DataWasDestroyed(); } void SkipCommand(CommandIterator* commands, Command type) { switch (type) { case Command::BeginComputePass: commands->NextCommand(); break; case Command::BeginRenderPass: commands->NextCommand(); break; case Command::BeginRenderSubpass: commands->NextCommand(); break; case Command::CopyBufferToBuffer: commands->NextCommand(); break; case Command::CopyBufferToTexture: commands->NextCommand(); break; case Command::CopyTextureToBuffer: commands->NextCommand(); break; case Command::Dispatch: commands->NextCommand(); break; case Command::DrawArrays: commands->NextCommand(); break; case Command::DrawElements: commands->NextCommand(); break; case Command::EndComputePass: commands->NextCommand(); break; case Command::EndRenderPass: commands->NextCommand(); break; case Command::EndRenderSubpass: commands->NextCommand(); break; case Command::SetComputePipeline: commands->NextCommand(); break; case Command::SetRenderPipeline: commands->NextCommand(); break; case Command::SetPushConstants: { auto* cmd = commands->NextCommand(); commands->NextData(cmd->count); } break; case Command::SetStencilReference: commands->NextCommand(); break; case Command::SetBindGroup: commands->NextCommand(); break; case Command::SetIndexBuffer: commands->NextCommand(); break; case Command::SetVertexBuffers: { auto* cmd = commands->NextCommand(); commands->NextData>(cmd->count); commands->NextData(cmd->count); } break; case Command::TransitionBufferUsage: commands->NextCommand(); break; case Command::TransitionTextureUsage: commands->NextCommand(); break; } } CommandBufferBuilder::CommandBufferBuilder(DeviceBase* device) : Builder(device), state(std::make_unique(this)) { } CommandBufferBuilder::~CommandBufferBuilder() { if (!commandsAcquired) { MoveToIterator(); FreeCommands(&iterator); } } bool CommandBufferBuilder::ValidateGetResult() { MoveToIterator(); Command type; while (iterator.NextCommandId(&type)) { switch (type) { case Command::BeginComputePass: { iterator.NextCommand(); if (!state->BeginComputePass()) { return false; } } break; case Command::BeginRenderPass: { BeginRenderPassCmd* cmd = iterator.NextCommand(); auto* renderPass = cmd->renderPass.Get(); auto* framebuffer = cmd->framebuffer.Get(); // TODO(kainino@chromium.org): null checks should not be necessary if (renderPass == nullptr) { HandleError("Render pass is invalid"); return false; } if (framebuffer == nullptr) { HandleError("Framebuffer is invalid"); return false; } if (!state->BeginRenderPass(renderPass, framebuffer)) { return false; } } break; case Command::BeginRenderSubpass: { iterator.NextCommand(); if (!state->BeginSubpass()) { return false; } } break; case Command::CopyBufferToBuffer: { CopyBufferToBufferCmd* copy = iterator.NextCommand(); if (!ValidateCopySizeFitsInBuffer(this, copy->source, copy->size) || !ValidateCopySizeFitsInBuffer(this, copy->destination, copy->size) || !state->ValidateCanCopy() || !state->ValidateCanUseBufferAs(copy->source.buffer.Get(), nxt::BufferUsageBit::TransferSrc) || !state->ValidateCanUseBufferAs(copy->destination.buffer.Get(), nxt::BufferUsageBit::TransferDst)) { return false; } } break; case Command::CopyBufferToTexture: { CopyBufferToTextureCmd* copy = iterator.NextCommand(); uint32_t bufferCopySize = 0; if (!ValidateRowPitch(this, copy->destination, copy->rowPitch) || !ComputeTextureCopyBufferSize(this, copy->destination, copy->rowPitch, &bufferCopySize) || !ValidateCopyLocationFitsInTexture(this, copy->destination) || !ValidateCopySizeFitsInBuffer(this, copy->source, bufferCopySize) || !ValidateTexelBufferOffset(this, copy->destination.texture.Get(), copy->source) || !state->ValidateCanCopy() || !state->ValidateCanUseBufferAs(copy->source.buffer.Get(), nxt::BufferUsageBit::TransferSrc) || !state->ValidateCanUseTextureAs(copy->destination.texture.Get(), nxt::TextureUsageBit::TransferDst)) { return false; } } break; case Command::CopyTextureToBuffer: { CopyTextureToBufferCmd* copy = iterator.NextCommand(); uint32_t bufferCopySize = 0; if (!ValidateRowPitch(this, copy->source, copy->rowPitch) || !ComputeTextureCopyBufferSize(this, copy->source, copy->rowPitch, &bufferCopySize) || !ValidateCopyLocationFitsInTexture(this, copy->source) || !ValidateCopySizeFitsInBuffer(this, copy->destination, bufferCopySize) || !ValidateTexelBufferOffset(this, copy->source.texture.Get(), copy->destination) || !state->ValidateCanCopy() || !state->ValidateCanUseTextureAs(copy->source.texture.Get(), nxt::TextureUsageBit::TransferSrc) || !state->ValidateCanUseBufferAs(copy->destination.buffer.Get(), nxt::BufferUsageBit::TransferDst)) { return false; } } break; case Command::Dispatch: { iterator.NextCommand(); if (!state->ValidateCanDispatch()) { return false; } } break; case Command::DrawArrays: { iterator.NextCommand(); if (!state->ValidateCanDrawArrays()) { return false; } } break; case Command::DrawElements: { iterator.NextCommand(); if (!state->ValidateCanDrawElements()) { return false; } } break; case Command::EndComputePass: { iterator.NextCommand(); if (!state->EndComputePass()) { return false; } } break; case Command::EndRenderPass: { iterator.NextCommand(); if (!state->EndRenderPass()) { return false; } } break; case Command::EndRenderSubpass: { iterator.NextCommand(); if (!state->EndSubpass()) { return false; } } break; case Command::SetComputePipeline: { SetComputePipelineCmd* cmd = iterator.NextCommand(); ComputePipelineBase* pipeline = cmd->pipeline.Get(); if (!state->SetComputePipeline(pipeline)) { return false; } } break; case Command::SetRenderPipeline: { SetRenderPipelineCmd* cmd = iterator.NextCommand(); RenderPipelineBase* pipeline = cmd->pipeline.Get(); if (!state->SetRenderPipeline(pipeline)) { return false; } } break; case Command::SetPushConstants: { SetPushConstantsCmd* cmd = iterator.NextCommand(); iterator.NextData(cmd->count); // Validation of count and offset has already been done when the command was recorded // because it impacts the size of an allocation in the CommandAllocator. if (!state->ValidateSetPushConstants(cmd->stages)) { return false; } } break; case Command::SetStencilReference: { iterator.NextCommand(); if (!state->HaveRenderPass()) { HandleError("Can't set stencil reference without an active render pass"); return false; } } break; case Command::SetBindGroup: { SetBindGroupCmd* cmd = iterator.NextCommand(); if (!state->SetBindGroup(cmd->index, cmd->group.Get())) { return false; } } break; case Command::SetIndexBuffer: { SetIndexBufferCmd* cmd = iterator.NextCommand(); if (!state->SetIndexBuffer(cmd->buffer.Get())) { return false; } } break; case Command::SetVertexBuffers: { SetVertexBuffersCmd* cmd = iterator.NextCommand(); auto buffers = iterator.NextData>(cmd->count); iterator.NextData(cmd->count); for (uint32_t i = 0; i < cmd->count; ++i) { state->SetVertexBuffer(cmd->startSlot + i, buffers[i].Get()); } } break; case Command::TransitionBufferUsage: { TransitionBufferUsageCmd* cmd = iterator.NextCommand(); if (!state->TransitionBufferUsage(cmd->buffer.Get(), cmd->usage)) { return false; } } break; case Command::TransitionTextureUsage: { TransitionTextureUsageCmd* cmd = iterator.NextCommand(); if (!state->TransitionTextureUsage(cmd->texture.Get(), cmd->usage)) { return false; } } break; } } if (!state->ValidateEndCommandBuffer()) { return false; } return true; } CommandIterator CommandBufferBuilder::AcquireCommands() { ASSERT(!commandsAcquired); commandsAcquired = true; return std::move(iterator); } CommandBufferBase* CommandBufferBuilder::GetResultImpl() { MoveToIterator(); return device->CreateCommandBuffer(this); } void CommandBufferBuilder::BeginComputePass() { allocator.Allocate(Command::BeginComputePass); } void CommandBufferBuilder::BeginRenderPass(RenderPassBase* renderPass, FramebufferBase* framebuffer) { BeginRenderPassCmd* cmd = allocator.Allocate(Command::BeginRenderPass); new(cmd) BeginRenderPassCmd; cmd->renderPass = renderPass; cmd->framebuffer = framebuffer; } void CommandBufferBuilder::BeginRenderSubpass() { allocator.Allocate(Command::BeginRenderSubpass); } void CommandBufferBuilder::CopyBufferToBuffer(BufferBase* source, uint32_t sourceOffset, BufferBase* destination, uint32_t destinationOffset, uint32_t size) { CopyBufferToBufferCmd* copy = allocator.Allocate(Command::CopyBufferToBuffer); new(copy) CopyBufferToBufferCmd; copy->source.buffer = source; copy->source.offset = sourceOffset; copy->destination.buffer = destination; copy->destination.offset = destinationOffset; copy->size = size; } void CommandBufferBuilder::CopyBufferToTexture(BufferBase* buffer, uint32_t bufferOffset, uint32_t rowPitch, TextureBase* texture, uint32_t x, uint32_t y, uint32_t z, uint32_t width, uint32_t height, uint32_t depth, uint32_t level) { if (rowPitch == 0) { rowPitch = ComputeDefaultRowPitch(texture, width); } CopyBufferToTextureCmd* copy = allocator.Allocate(Command::CopyBufferToTexture); new(copy) CopyBufferToTextureCmd; copy->source.buffer = buffer; copy->source.offset = bufferOffset; copy->destination.texture = texture; copy->destination.x = x; copy->destination.y = y; copy->destination.z = z; copy->destination.width = width; copy->destination.height = height; copy->destination.depth = depth; copy->destination.level = level; copy->rowPitch = rowPitch; } void CommandBufferBuilder::CopyTextureToBuffer(TextureBase* texture, uint32_t x, uint32_t y, uint32_t z, uint32_t width, uint32_t height, uint32_t depth, uint32_t level, BufferBase* buffer, uint32_t bufferOffset, uint32_t rowPitch) { if (rowPitch == 0) { rowPitch = ComputeDefaultRowPitch(texture, width); } CopyTextureToBufferCmd* copy = allocator.Allocate(Command::CopyTextureToBuffer); new(copy) CopyTextureToBufferCmd; copy->source.texture = texture; copy->source.x = x; copy->source.y = y; copy->source.z = z; copy->source.width = width; copy->source.height = height; copy->source.depth = depth; copy->source.level = level; copy->destination.buffer = buffer; copy->destination.offset = bufferOffset; copy->rowPitch = rowPitch; } void CommandBufferBuilder::Dispatch(uint32_t x, uint32_t y, uint32_t z) { DispatchCmd* dispatch = allocator.Allocate(Command::Dispatch); new(dispatch) DispatchCmd; dispatch->x = x; dispatch->y = y; dispatch->z = z; } void CommandBufferBuilder::DrawArrays(uint32_t vertexCount, uint32_t instanceCount, uint32_t firstVertex, uint32_t firstInstance) { DrawArraysCmd* draw = allocator.Allocate(Command::DrawArrays); new(draw) DrawArraysCmd; draw->vertexCount = vertexCount; draw->instanceCount = instanceCount; draw->firstVertex = firstVertex; draw->firstInstance = firstInstance; } void CommandBufferBuilder::DrawElements(uint32_t indexCount, uint32_t instanceCount, uint32_t firstIndex, uint32_t firstInstance) { DrawElementsCmd* draw = allocator.Allocate(Command::DrawElements); new(draw) DrawElementsCmd; draw->indexCount = indexCount; draw->instanceCount = instanceCount; draw->firstIndex = firstIndex; draw->firstInstance = firstInstance; } void CommandBufferBuilder::EndComputePass() { allocator.Allocate(Command::EndComputePass); } void CommandBufferBuilder::EndRenderPass() { allocator.Allocate(Command::EndRenderPass); } void CommandBufferBuilder::EndRenderSubpass() { allocator.Allocate(Command::EndRenderSubpass); } void CommandBufferBuilder::SetComputePipeline(ComputePipelineBase* pipeline) { SetComputePipelineCmd* cmd = allocator.Allocate(Command::SetComputePipeline); new(cmd) SetComputePipelineCmd; cmd->pipeline = pipeline; } void CommandBufferBuilder::SetRenderPipeline(RenderPipelineBase* pipeline) { SetRenderPipelineCmd* cmd = allocator.Allocate(Command::SetRenderPipeline); new(cmd) SetRenderPipelineCmd; cmd->pipeline = pipeline; } void CommandBufferBuilder::SetPushConstants(nxt::ShaderStageBit stages, uint32_t offset, uint32_t count, const void* data) { // TODO(cwallez@chromium.org): check for overflows if (offset + count > kMaxPushConstants) { HandleError("Setting too many push constants"); return; } SetPushConstantsCmd* cmd = allocator.Allocate(Command::SetPushConstants); new(cmd) SetPushConstantsCmd; cmd->stages = stages; cmd->offset = offset; cmd->count = count; uint32_t* values = allocator.AllocateData(count); memcpy(values, data, count * sizeof(uint32_t)); } void CommandBufferBuilder::SetStencilReference(uint32_t reference) { SetStencilReferenceCmd* cmd = allocator.Allocate(Command::SetStencilReference); new(cmd) SetStencilReferenceCmd; cmd->reference = reference; } void CommandBufferBuilder::SetBindGroup(uint32_t groupIndex, BindGroupBase* group) { if (groupIndex >= kMaxBindGroups) { HandleError("Setting bind group over the max"); return; } SetBindGroupCmd* cmd = allocator.Allocate(Command::SetBindGroup); new(cmd) SetBindGroupCmd; cmd->index = groupIndex; cmd->group = group; } void CommandBufferBuilder::SetIndexBuffer(BufferBase* buffer, uint32_t offset, nxt::IndexFormat format) { // TODO(kainino@chromium.org): validation SetIndexBufferCmd* cmd = allocator.Allocate(Command::SetIndexBuffer); new(cmd) SetIndexBufferCmd; cmd->buffer = buffer; cmd->offset = offset; cmd->format = format; } void CommandBufferBuilder::SetVertexBuffers(uint32_t startSlot, uint32_t count, BufferBase* const* buffers, uint32_t const* offsets){ // TODO(kainino@chromium.org): validation SetVertexBuffersCmd* cmd = allocator.Allocate(Command::SetVertexBuffers); new(cmd) SetVertexBuffersCmd; cmd->startSlot = startSlot; cmd->count = count; Ref* cmdBuffers = allocator.AllocateData>(count); for (size_t i = 0; i < count; ++i) { new(&cmdBuffers[i]) Ref(buffers[i]); } uint32_t* cmdOffsets = allocator.AllocateData(count); memcpy(cmdOffsets, offsets, count * sizeof(uint32_t)); } void CommandBufferBuilder::TransitionBufferUsage(BufferBase* buffer, nxt::BufferUsageBit usage) { TransitionBufferUsageCmd* cmd = allocator.Allocate(Command::TransitionBufferUsage); new(cmd) TransitionBufferUsageCmd; cmd->buffer = buffer; cmd->usage = usage; } void CommandBufferBuilder::TransitionTextureUsage(TextureBase* texture, nxt::TextureUsageBit usage) { TransitionTextureUsageCmd* cmd = allocator.Allocate(Command::TransitionTextureUsage); new(cmd) TransitionTextureUsageCmd; cmd->texture = texture; cmd->usage = usage; } void CommandBufferBuilder::MoveToIterator() { if (!movedToIterator) { iterator = std::move(allocator); movedToIterator = true; } } }