mirror of
				https://github.com/encounter/dawn-cmake.git
				synced 2025-10-25 03:00:29 +00:00 
			
		
		
		
	Pipeline cache D3D12 backend impl
Add D3D12 pipeline caching impl: store cachedPSO blob in cached blob. Record root signature ID3DBlob in cache key together with D3D_SHADER_BYTECODE, D3D12_GRAPHICS_PIPELINE_STATE_DESC or D3D12_COMPUTE_PIPELINE_STATE_DESC. Shader caching is not added. Add some pipeline caching negative tests. Bug: dawn:549 Change-Id: Id1cb560b49f1cf495860e2e0bcf92d8d988c5379 Reviewed-on: https://dawn-review.googlesource.com/c/dawn/+/91180 Auto-Submit: Shrek Shao <shrekshao@google.com> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: Austin Eng <enga@chromium.org> Reviewed-by: Loko Kung <lokokung@google.com> Commit-Queue: Austin Eng <enga@chromium.org>
This commit is contained in:
		
							parent
							
								
									c0af5c5c9c
								
							
						
					
					
						commit
						4313dba514
					
				
							
								
								
									
										2
									
								
								.gitattributes
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										2
									
								
								.gitattributes
									
									
									
									
										vendored
									
									
								
							| @ -7,3 +7,5 @@ | ||||
| *.sh     eol=lf | ||||
| *.spvasm eol=lf | ||||
| *.wgsl   eol=lf | ||||
| *.h      eol=lf | ||||
| *.cpp    eol=lf | ||||
| @ -378,6 +378,7 @@ source_set("sources") { | ||||
|       "d3d12/BufferD3D12.h", | ||||
|       "d3d12/CPUDescriptorHeapAllocationD3D12.cpp", | ||||
|       "d3d12/CPUDescriptorHeapAllocationD3D12.h", | ||||
|       "d3d12/CacheKeyD3D12.cpp", | ||||
|       "d3d12/CommandAllocatorManager.cpp", | ||||
|       "d3d12/CommandAllocatorManager.h", | ||||
|       "d3d12/CommandBufferD3D12.cpp", | ||||
| @ -406,6 +407,7 @@ source_set("sources") { | ||||
|       "d3d12/NativeSwapChainImplD3D12.h", | ||||
|       "d3d12/PageableD3D12.cpp", | ||||
|       "d3d12/PageableD3D12.h", | ||||
|       "d3d12/PipelineCacheD3D12.cpp", | ||||
|       "d3d12/PipelineLayoutD3D12.cpp", | ||||
|       "d3d12/PipelineLayoutD3D12.h", | ||||
|       "d3d12/PlatformFunctions.cpp", | ||||
|  | ||||
| @ -21,39 +21,47 @@ | ||||
| 
 | ||||
| namespace dawn::native { | ||||
| 
 | ||||
| CachedBlob::CachedBlob(size_t size) { | ||||
|     if (size != 0) { | ||||
|         Reset(size); | ||||
| // static
 | ||||
| CachedBlob CachedBlob::Create(size_t size) { | ||||
|     if (size > 0) { | ||||
|         uint8_t* data = new uint8_t[size]; | ||||
|         return CachedBlob(data, size, [=]() { delete[] data; }); | ||||
|     } else { | ||||
|         return CachedBlob(); | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| CachedBlob::CachedBlob() : mData(nullptr), mSize(0), mDeleter({}) {} | ||||
| 
 | ||||
| CachedBlob::CachedBlob(uint8_t* data, size_t size, std::function<void()> deleter) | ||||
|     : mData(data), mSize(size), mDeleter(deleter) {} | ||||
| 
 | ||||
| CachedBlob::CachedBlob(CachedBlob&&) = default; | ||||
| 
 | ||||
| CachedBlob::~CachedBlob() = default; | ||||
| 
 | ||||
| CachedBlob& CachedBlob::operator=(CachedBlob&&) = default; | ||||
| 
 | ||||
| CachedBlob::~CachedBlob() { | ||||
|     if (mDeleter) { | ||||
|         mDeleter(); | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| bool CachedBlob::Empty() const { | ||||
|     return mSize == 0; | ||||
| } | ||||
| 
 | ||||
| const uint8_t* CachedBlob::Data() const { | ||||
|     return mData.get(); | ||||
|     return mData; | ||||
| } | ||||
| 
 | ||||
| uint8_t* CachedBlob::Data() { | ||||
|     return mData.get(); | ||||
|     return mData; | ||||
| } | ||||
| 
 | ||||
| size_t CachedBlob::Size() const { | ||||
|     return mSize; | ||||
| } | ||||
| 
 | ||||
| void CachedBlob::Reset(size_t size) { | ||||
|     mSize = size; | ||||
|     mData = std::make_unique<uint8_t[]>(size); | ||||
| } | ||||
| 
 | ||||
| BlobCache::BlobCache(dawn::platform::CachingInterface* cachingInterface) | ||||
|     : mCache(cachingInterface) {} | ||||
| 
 | ||||
| @ -72,19 +80,20 @@ void BlobCache::Store(const CacheKey& key, const CachedBlob& value) { | ||||
| } | ||||
| 
 | ||||
| CachedBlob BlobCache::LoadInternal(const CacheKey& key) { | ||||
|     CachedBlob result; | ||||
|     if (mCache == nullptr) { | ||||
|         return result; | ||||
|         return CachedBlob(); | ||||
|     } | ||||
|     const size_t expectedSize = mCache->LoadData(key.data(), key.size(), nullptr, 0); | ||||
|     if (expectedSize > 0) { | ||||
|         result.Reset(expectedSize); | ||||
|         // Need to put this inside to trigger copy elision.
 | ||||
|         CachedBlob result = CachedBlob::Create(expectedSize); | ||||
|         const size_t actualSize = | ||||
|             mCache->LoadData(key.data(), key.size(), result.Data(), expectedSize); | ||||
|         ASSERT(expectedSize == actualSize); | ||||
|     } | ||||
|         return result; | ||||
|     } | ||||
|     return CachedBlob(); | ||||
| } | ||||
| 
 | ||||
| void BlobCache::StoreInternal(const CacheKey& key, size_t valueSize, const void* value) { | ||||
|     ASSERT(value != nullptr); | ||||
|  | ||||
| @ -15,9 +15,16 @@ | ||||
| #ifndef SRC_DAWN_NATIVE_BLOBCACHE_H_ | ||||
| #define SRC_DAWN_NATIVE_BLOBCACHE_H_ | ||||
| 
 | ||||
| #include <functional> | ||||
| #include <memory> | ||||
| #include <mutex> | ||||
| 
 | ||||
| #include "dawn/common/Platform.h" | ||||
| 
 | ||||
| #if defined(DAWN_PLATFORM_WINDOWS) | ||||
| #include "dawn/native/d3d12/d3d12_platform.h" | ||||
| #endif  // DAWN_PLATFORM_WINDOWS
 | ||||
| 
 | ||||
| namespace dawn::platform { | ||||
| class CachingInterface; | ||||
| } | ||||
| @ -30,21 +37,34 @@ class InstanceBase; | ||||
| 
 | ||||
| class CachedBlob { | ||||
|   public: | ||||
|     explicit CachedBlob(size_t size = 0); | ||||
|     CachedBlob(CachedBlob&&); | ||||
|     ~CachedBlob(); | ||||
|     static CachedBlob Create(size_t size); | ||||
| 
 | ||||
| #if defined(DAWN_PLATFORM_WINDOWS) | ||||
|     static CachedBlob Create(Microsoft::WRL::ComPtr<ID3DBlob> blob); | ||||
| #endif  // DAWN_PLATFORM_WINDOWS
 | ||||
| 
 | ||||
|     CachedBlob(const CachedBlob&) = delete; | ||||
|     CachedBlob& operator=(const CachedBlob&) = delete; | ||||
| 
 | ||||
|     CachedBlob(CachedBlob&&); | ||||
|     CachedBlob& operator=(CachedBlob&&); | ||||
| 
 | ||||
|     ~CachedBlob(); | ||||
| 
 | ||||
|     bool Empty() const; | ||||
|     const uint8_t* Data() const; | ||||
|     uint8_t* Data(); | ||||
|     size_t Size() const; | ||||
|     void Reset(size_t size); | ||||
| 
 | ||||
|     CachedBlob(); | ||||
| 
 | ||||
|   private: | ||||
|     std::unique_ptr<uint8_t[]> mData = nullptr; | ||||
|     size_t mSize = 0; | ||||
|     explicit CachedBlob(uint8_t* data, size_t size, std::function<void()> deleter); | ||||
| 
 | ||||
|     uint8_t* mData; | ||||
|     size_t mSize; | ||||
|     std::function<void()> mDeleter; | ||||
| }; | ||||
| 
 | ||||
| // This class should always be thread-safe because it may be called asynchronously. Its purpose
 | ||||
|  | ||||
| @ -247,6 +247,7 @@ if (DAWN_ENABLE_D3D12) | ||||
|         "d3d12/CPUDescriptorHeapAllocationD3D12.h" | ||||
|         "d3d12/CommandAllocatorManager.cpp" | ||||
|         "d3d12/CommandAllocatorManager.h" | ||||
|         "d3d12/CacheKeyD3D12.cpp" | ||||
|         "d3d12/CommandBufferD3D12.cpp" | ||||
|         "d3d12/CommandBufferD3D12.h" | ||||
|         "d3d12/CommandRecordingContext.cpp" | ||||
| @ -273,6 +274,7 @@ if (DAWN_ENABLE_D3D12) | ||||
|         "d3d12/NativeSwapChainImplD3D12.h" | ||||
|         "d3d12/PageableD3D12.cpp" | ||||
|         "d3d12/PageableD3D12.h" | ||||
|         "d3d12/PipelineCacheD3D12.cpp" | ||||
|         "d3d12/PipelineLayoutD3D12.cpp" | ||||
|         "d3d12/PipelineLayoutD3D12.h" | ||||
|         "d3d12/PlatformFunctions.cpp" | ||||
|  | ||||
| @ -628,6 +628,23 @@ BlobCache* DeviceBase::GetBlobCache() { | ||||
|     return nullptr; | ||||
| } | ||||
| 
 | ||||
| CachedBlob DeviceBase::LoadCachedBlob(const CacheKey& key) { | ||||
|     BlobCache* blobCache = GetBlobCache(); | ||||
|     if (!blobCache) { | ||||
|         return CachedBlob(); | ||||
|     } | ||||
|     return blobCache->Load(key); | ||||
| } | ||||
| 
 | ||||
| void DeviceBase::StoreCachedBlob(const CacheKey& key, const CachedBlob& blob) { | ||||
|     if (!blob.Empty()) { | ||||
|         BlobCache* blobCache = GetBlobCache(); | ||||
|         if (blobCache) { | ||||
|             blobCache->Store(key, blob); | ||||
|         } | ||||
|     } | ||||
| } | ||||
| 
 | ||||
| MaybeError DeviceBase::ValidateObject(const ApiObjectBase* object) const { | ||||
|     ASSERT(object != nullptr); | ||||
|     DAWN_INVALID_IF(object->GetDevice() != this, | ||||
|  | ||||
| @ -22,6 +22,7 @@ | ||||
| #include <utility> | ||||
| #include <vector> | ||||
| 
 | ||||
| #include "dawn/native/BlobCache.h" | ||||
| #include "dawn/native/CacheKey.h" | ||||
| #include "dawn/native/Commands.h" | ||||
| #include "dawn/native/ComputePipeline.h" | ||||
| @ -47,7 +48,6 @@ namespace dawn::native { | ||||
| class AsyncTaskManager; | ||||
| class AttachmentState; | ||||
| class AttachmentStateBlueprint; | ||||
| class BlobCache; | ||||
| class CallbackTaskManager; | ||||
| class DynamicUploader; | ||||
| class ErrorScopeStack; | ||||
| @ -284,6 +284,8 @@ class DeviceBase : public RefCountedWithExternalCount { | ||||
|     MaybeError ValidateIsAlive() const; | ||||
| 
 | ||||
|     BlobCache* GetBlobCache(); | ||||
|     CachedBlob LoadCachedBlob(const CacheKey& key); | ||||
|     void StoreCachedBlob(const CacheKey& key, const CachedBlob& blob); | ||||
| 
 | ||||
|     virtual ResultOrError<std::unique_ptr<StagingBufferBase>> CreateStagingBuffer(size_t size) = 0; | ||||
|     virtual MaybeError CopyFromStagingToBuffer(StagingBufferBase* source, | ||||
|  | ||||
| @ -38,7 +38,7 @@ MaybeError PipelineCacheBase::Flush() { | ||||
|     } | ||||
|     // Try to write the data out to the persistent cache.
 | ||||
|     CachedBlob blob; | ||||
|     DAWN_TRY_ASSIGN(blob, SerializeToBlobImpl()); | ||||
|     DAWN_TRY(SerializeToBlobImpl(&blob)); | ||||
|     if (blob.Size() > 0) { | ||||
|         // Using a simple heuristic to decide whether to write out the blob right now. May need
 | ||||
|         // smarter tracking when we are dealing with monolithic caches.
 | ||||
|  | ||||
| @ -45,9 +45,10 @@ class PipelineCacheBase : public RefCounted { | ||||
|     CachedBlob Initialize(); | ||||
| 
 | ||||
|   private: | ||||
|     // Backend implementation of serialization of the cache into a blob. Note that an empty
 | ||||
|     // blob may be returned.
 | ||||
|     virtual ResultOrError<CachedBlob> SerializeToBlobImpl() = 0; | ||||
|     // Backend implementation of serialization of the cache into a blob.
 | ||||
|     // Note: given that no local cached blob should be destructed and copy elision has strict
 | ||||
|     // requirement cached blob is passed in as a pointer to be assigned.
 | ||||
|     virtual MaybeError SerializeToBlobImpl(CachedBlob* blob) = 0; | ||||
| 
 | ||||
|     // The blob cache is owned by the Adapter and pipeline caches are owned/created by devices
 | ||||
|     // or adapters. Since the device owns a reference to the Instance which owns the Adapter,
 | ||||
|  | ||||
							
								
								
									
										139
									
								
								src/dawn/native/d3d12/CacheKeyD3D12.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										139
									
								
								src/dawn/native/d3d12/CacheKeyD3D12.cpp
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,139 @@ | ||||
| // Copyright 2022 The Dawn Authors
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include "dawn/common/Assert.h" | ||||
| #include "dawn/common/Constants.h" | ||||
| #include "dawn/native/CacheKey.h" | ||||
| #include "dawn/native/d3d12/d3d12_platform.h" | ||||
| 
 | ||||
| namespace dawn::native { | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_COMPUTE_PIPELINE_STATE_DESC>::Serialize( | ||||
|     CacheKey* key, | ||||
|     const D3D12_COMPUTE_PIPELINE_STATE_DESC& t) { | ||||
|     // Don't record pRootSignature as we already record the signature blob in pipline layout.
 | ||||
|     key->Record(t.CS).Record(t.NodeMask).Record(t.Flags); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_RENDER_TARGET_BLEND_DESC>::Serialize( | ||||
|     CacheKey* key, | ||||
|     const D3D12_RENDER_TARGET_BLEND_DESC& t) { | ||||
|     key->Record(t.BlendEnable, t.LogicOpEnable, t.SrcBlend, t.DestBlend, t.BlendOp, t.SrcBlendAlpha, | ||||
|                 t.DestBlendAlpha, t.BlendOpAlpha, t.LogicOp, t.RenderTargetWriteMask); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_BLEND_DESC>::Serialize(CacheKey* key, const D3D12_BLEND_DESC& t) { | ||||
|     key->Record(t.AlphaToCoverageEnable, t.IndependentBlendEnable).Record(t.RenderTarget); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_DEPTH_STENCILOP_DESC>::Serialize( | ||||
|     CacheKey* key, | ||||
|     const D3D12_DEPTH_STENCILOP_DESC& t) { | ||||
|     key->Record(t.StencilFailOp, t.StencilDepthFailOp, t.StencilPassOp, t.StencilFunc); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_DEPTH_STENCIL_DESC>::Serialize(CacheKey* key, | ||||
|                                                              const D3D12_DEPTH_STENCIL_DESC& t) { | ||||
|     key->Record(t.DepthEnable, t.DepthWriteMask, t.DepthFunc, t.StencilEnable, t.StencilReadMask, | ||||
|                 t.StencilWriteMask, t.FrontFace, t.BackFace); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_RASTERIZER_DESC>::Serialize(CacheKey* key, | ||||
|                                                           const D3D12_RASTERIZER_DESC& t) { | ||||
|     key->Record(t.FillMode, t.CullMode, t.FrontCounterClockwise, t.DepthBias, t.DepthBiasClamp, | ||||
|                 t.SlopeScaledDepthBias, t.DepthClipEnable, t.MultisampleEnable, | ||||
|                 t.AntialiasedLineEnable, t.ForcedSampleCount, t.ConservativeRaster); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_INPUT_ELEMENT_DESC>::Serialize(CacheKey* key, | ||||
|                                                              const D3D12_INPUT_ELEMENT_DESC& t) { | ||||
|     key->Record(t.SemanticName, t.SemanticIndex, t.Format, t.InputSlot, t.AlignedByteOffset, | ||||
|                 t.InputSlotClass, t.InstanceDataStepRate); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_INPUT_LAYOUT_DESC>::Serialize(CacheKey* key, | ||||
|                                                             const D3D12_INPUT_LAYOUT_DESC& t) { | ||||
|     key->RecordIterable(t.pInputElementDescs, t.NumElements); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_SO_DECLARATION_ENTRY>::Serialize( | ||||
|     CacheKey* key, | ||||
|     const D3D12_SO_DECLARATION_ENTRY& t) { | ||||
|     key->Record(t.Stream, t.SemanticName, t.SemanticIndex, t.StartComponent, t.ComponentCount, | ||||
|                 t.OutputSlot); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_STREAM_OUTPUT_DESC>::Serialize(CacheKey* key, | ||||
|                                                              const D3D12_STREAM_OUTPUT_DESC& t) { | ||||
|     key->RecordIterable(t.pSODeclaration, t.NumEntries) | ||||
|         .RecordIterable(t.pBufferStrides, t.NumStrides) | ||||
|         .Record(t.RasterizedStream); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<DXGI_SAMPLE_DESC>::Serialize(CacheKey* key, const DXGI_SAMPLE_DESC& t) { | ||||
|     key->Record(t.Count, t.Quality); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_SHADER_BYTECODE>::Serialize(CacheKey* key, | ||||
|                                                           const D3D12_SHADER_BYTECODE& t) { | ||||
|     key->RecordIterable(reinterpret_cast<const uint8_t*>(t.pShaderBytecode), t.BytecodeLength); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<D3D12_GRAPHICS_PIPELINE_STATE_DESC>::Serialize( | ||||
|     CacheKey* key, | ||||
|     const D3D12_GRAPHICS_PIPELINE_STATE_DESC& t) { | ||||
|     // Don't record pRootSignature as we already record the signature blob in pipline layout.
 | ||||
|     // Don't record CachedPSO as it is in the cached blob.
 | ||||
|     key->Record(t.VS) | ||||
|         .Record(t.PS) | ||||
|         .Record(t.DS) | ||||
|         .Record(t.HS) | ||||
|         .Record(t.GS) | ||||
|         .Record(t.StreamOutput) | ||||
|         .Record(t.BlendState) | ||||
|         .Record(t.SampleMask) | ||||
|         .Record(t.RasterizerState) | ||||
|         .Record(t.DepthStencilState) | ||||
|         .Record(t.InputLayout) | ||||
|         .Record(t.IBStripCutValue) | ||||
|         .Record(t.PrimitiveTopologyType) | ||||
|         .RecordIterable(t.RTVFormats, t.NumRenderTargets) | ||||
|         .Record(t.DSVFormat) | ||||
|         .Record(t.SampleDesc) | ||||
|         .Record(t.NodeMask) | ||||
|         .Record(t.Flags); | ||||
| } | ||||
| 
 | ||||
| template <> | ||||
| void CacheKeySerializer<ID3DBlob>::Serialize(CacheKey* key, const ID3DBlob& t) { | ||||
|     // Workaround: GetBufferPointer and GetbufferSize are not marked as const
 | ||||
|     ID3DBlob* pBlob = const_cast<ID3DBlob*>(&t); | ||||
|     key->RecordIterable(reinterpret_cast<uint8_t*>(pBlob->GetBufferPointer()), | ||||
|                         pBlob->GetBufferSize()); | ||||
| } | ||||
| 
 | ||||
| }  // namespace dawn::native
 | ||||
| @ -55,15 +55,36 @@ MaybeError ComputePipeline::Initialize() { | ||||
|     D3D12_COMPUTE_PIPELINE_STATE_DESC d3dDesc = {}; | ||||
|     d3dDesc.pRootSignature = ToBackend(GetLayout())->GetRootSignature(); | ||||
| 
 | ||||
|     // TODO(dawn:549): Compile shader everytime before we implement compiled shader cache
 | ||||
|     CompiledShader compiledShader; | ||||
|     DAWN_TRY_ASSIGN(compiledShader, module->Compile(computeStage, SingleShaderStage::Compute, | ||||
|                                                     ToBackend(GetLayout()), compileFlags)); | ||||
|     d3dDesc.CS = compiledShader.GetD3D12ShaderBytecode(); | ||||
| 
 | ||||
|     mCacheKey.Record(d3dDesc, ToBackend(GetLayout())->GetRootSignatureBlob()); | ||||
| 
 | ||||
|     // Try to see if we have anything in the blob cache.
 | ||||
|     CachedBlob blob = device->LoadCachedBlob(GetCacheKey()); | ||||
|     const bool cacheHit = !blob.Empty(); | ||||
|     if (cacheHit) { | ||||
|         // Cache hits, attach cached blob to descriptor.
 | ||||
|         d3dDesc.CachedPSO.pCachedBlob = blob.Data(); | ||||
|         d3dDesc.CachedPSO.CachedBlobSizeInBytes = blob.Size(); | ||||
|     } | ||||
| 
 | ||||
|     auto* d3d12Device = device->GetD3D12Device(); | ||||
|     DAWN_TRY(CheckHRESULT( | ||||
|         d3d12Device->CreateComputePipelineState(&d3dDesc, IID_PPV_ARGS(&mPipelineState)), | ||||
|         "D3D12 creating pipeline state")); | ||||
| 
 | ||||
|     if (!cacheHit) { | ||||
|         // Cache misses, need to get pipeline cached blob and store.
 | ||||
|         ComPtr<ID3DBlob> d3dBlob; | ||||
|         DAWN_TRY(CheckHRESULT(GetPipelineState()->GetCachedBlob(&d3dBlob), | ||||
|                               "D3D12 compute pipeline state get cached blob")); | ||||
|         device->StoreCachedBlob(GetCacheKey(), CachedBlob::Create(std::move(d3dBlob))); | ||||
|     } | ||||
| 
 | ||||
|     SetLabelImpl(); | ||||
| 
 | ||||
|     return {}; | ||||
|  | ||||
| @ -441,6 +441,9 @@ ResultOrError<Ref<TextureViewBase>> Device::CreateTextureViewImpl( | ||||
|     const TextureViewDescriptor* descriptor) { | ||||
|     return TextureView::Create(texture, descriptor); | ||||
| } | ||||
| Ref<PipelineCacheBase> Device::GetOrCreatePipelineCacheImpl(const CacheKey& key) { | ||||
|     UNREACHABLE(); | ||||
| } | ||||
| void Device::InitializeComputePipelineAsyncImpl(Ref<ComputePipelineBase> computePipeline, | ||||
|                                                 WGPUCreateComputePipelineAsyncCallback callback, | ||||
|                                                 void* userdata) { | ||||
|  | ||||
| @ -188,6 +188,7 @@ class Device final : public DeviceBase { | ||||
|         const ComputePipelineDescriptor* descriptor) override; | ||||
|     Ref<RenderPipelineBase> CreateUninitializedRenderPipelineImpl( | ||||
|         const RenderPipelineDescriptor* descriptor) override; | ||||
|     Ref<PipelineCacheBase> GetOrCreatePipelineCacheImpl(const CacheKey& key) override; | ||||
|     void InitializeComputePipelineAsyncImpl(Ref<ComputePipelineBase> computePipeline, | ||||
|                                             WGPUCreateComputePipelineAsyncCallback callback, | ||||
|                                             void* userdata) override; | ||||
|  | ||||
| @ -27,6 +27,7 @@ class CommandBuffer; | ||||
| class ComputePipeline; | ||||
| class Device; | ||||
| class Heap; | ||||
| class PipelineCache; | ||||
| class PipelineLayout; | ||||
| class QuerySet; | ||||
| class Queue; | ||||
| @ -46,6 +47,7 @@ struct D3D12BackendTraits { | ||||
|     using CommandBufferType = CommandBuffer; | ||||
|     using ComputePipelineType = ComputePipeline; | ||||
|     using DeviceType = Device; | ||||
|     using PipelineCacheType = PipelineCache; | ||||
|     using PipelineLayoutType = PipelineLayout; | ||||
|     using QuerySetType = QuerySet; | ||||
|     using QueueType = Queue; | ||||
|  | ||||
							
								
								
									
										33
									
								
								src/dawn/native/d3d12/PipelineCacheD3D12.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										33
									
								
								src/dawn/native/d3d12/PipelineCacheD3D12.cpp
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,33 @@ | ||||
| // Copyright 2022 The Dawn Authors
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include "dawn/native/BlobCache.h" | ||||
| #include "dawn/native/d3d12/d3d12_platform.h" | ||||
| 
 | ||||
| namespace dawn::native { | ||||
| 
 | ||||
| // static
 | ||||
| CachedBlob CachedBlob::Create(ComPtr<ID3DBlob> blob) { | ||||
|     // Detach so the deleter callback can "own" the reference
 | ||||
|     ID3DBlob* ptr = blob.Detach(); | ||||
|     return CachedBlob(reinterpret_cast<uint8_t*>(ptr->GetBufferPointer()), ptr->GetBufferSize(), | ||||
|                       [=]() { | ||||
|                           // Reattach and drop to delete it.
 | ||||
|                           ComPtr<ID3DBlob> b; | ||||
|                           b.Attach(ptr); | ||||
|                           b = nullptr; | ||||
|                       }); | ||||
| } | ||||
| 
 | ||||
| }  // namespace dawn::native
 | ||||
| @ -252,10 +252,9 @@ MaybeError PipelineLayout::Initialize() { | ||||
|     rootSignatureDescriptor.pStaticSamplers = nullptr; | ||||
|     rootSignatureDescriptor.Flags = D3D12_ROOT_SIGNATURE_FLAG_ALLOW_INPUT_ASSEMBLER_INPUT_LAYOUT; | ||||
| 
 | ||||
|     ComPtr<ID3DBlob> signature; | ||||
|     ComPtr<ID3DBlob> error; | ||||
|     HRESULT hr = device->GetFunctions()->d3d12SerializeRootSignature( | ||||
|         &rootSignatureDescriptor, D3D_ROOT_SIGNATURE_VERSION_1, &signature, &error); | ||||
|         &rootSignatureDescriptor, D3D_ROOT_SIGNATURE_VERSION_1, &mRootSignatureBlob, &error); | ||||
|     if (DAWN_UNLIKELY(FAILED(hr))) { | ||||
|         std::ostringstream messageStream; | ||||
|         if (error) { | ||||
| @ -269,9 +268,10 @@ MaybeError PipelineLayout::Initialize() { | ||||
|         DAWN_TRY(CheckHRESULT(hr, messageStream.str().c_str())); | ||||
|     } | ||||
|     DAWN_TRY(CheckHRESULT(device->GetD3D12Device()->CreateRootSignature( | ||||
|                               0, signature->GetBufferPointer(), signature->GetBufferSize(), | ||||
|                               IID_PPV_ARGS(&mRootSignature)), | ||||
|                               0, mRootSignatureBlob->GetBufferPointer(), | ||||
|                               mRootSignatureBlob->GetBufferSize(), IID_PPV_ARGS(&mRootSignature)), | ||||
|                           "D3D12 create root signature")); | ||||
|     mCacheKey.Record(mRootSignatureBlob.Get()); | ||||
|     return {}; | ||||
| } | ||||
| 
 | ||||
| @ -310,6 +310,10 @@ ID3D12RootSignature* PipelineLayout::GetRootSignature() const { | ||||
|     return mRootSignature.Get(); | ||||
| } | ||||
| 
 | ||||
| ID3DBlob* PipelineLayout::GetRootSignatureBlob() const { | ||||
|     return mRootSignatureBlob.Get(); | ||||
| } | ||||
| 
 | ||||
| const PipelineLayout::DynamicStorageBufferLengthInfo& | ||||
| PipelineLayout::GetDynamicStorageBufferLengthInfo() const { | ||||
|     return mDynamicStorageBufferLengthInfo; | ||||
|  | ||||
| @ -52,6 +52,8 @@ class PipelineLayout final : public PipelineLayoutBase { | ||||
| 
 | ||||
|     ID3D12RootSignature* GetRootSignature() const; | ||||
| 
 | ||||
|     ID3DBlob* GetRootSignatureBlob() const; | ||||
| 
 | ||||
|     ID3D12CommandSignature* GetDispatchIndirectCommandSignatureWithNumWorkgroups(); | ||||
| 
 | ||||
|     ID3D12CommandSignature* GetDrawIndirectCommandSignatureWithInstanceVertexOffsets(); | ||||
| @ -98,6 +100,8 @@ class PipelineLayout final : public PipelineLayoutBase { | ||||
|     uint32_t mNumWorkgroupsParameterIndex; | ||||
|     uint32_t mDynamicStorageBufferLengthsParameterIndex; | ||||
|     ComPtr<ID3D12RootSignature> mRootSignature; | ||||
|     // Store the root signature blob to put in pipeline cachekey
 | ||||
|     ComPtr<ID3DBlob> mRootSignatureBlob; | ||||
|     ComPtr<ID3D12CommandSignature> mDispatchIndirectCommandSignatureWithNumWorkgroups; | ||||
|     ComPtr<ID3D12CommandSignature> mDrawIndirectCommandSignatureWithInstanceVertexOffsets; | ||||
|     ComPtr<ID3D12CommandSignature> mDrawIndexedIndirectCommandSignatureWithInstanceVertexOffsets; | ||||
|  | ||||
| @ -429,10 +429,29 @@ MaybeError RenderPipeline::Initialize() { | ||||
| 
 | ||||
|     mD3d12PrimitiveTopology = D3D12PrimitiveTopology(GetPrimitiveTopology()); | ||||
| 
 | ||||
|     mCacheKey.Record(descriptorD3D12, *layout->GetRootSignatureBlob()); | ||||
| 
 | ||||
|     // Try to see if we have anything in the blob cache.
 | ||||
|     CachedBlob blob = device->LoadCachedBlob(GetCacheKey()); | ||||
|     const bool cacheHit = !blob.Empty(); | ||||
|     if (cacheHit) { | ||||
|         // Cache hits, attach cached blob to descriptor.
 | ||||
|         descriptorD3D12.CachedPSO.pCachedBlob = blob.Data(); | ||||
|         descriptorD3D12.CachedPSO.CachedBlobSizeInBytes = blob.Size(); | ||||
|     } | ||||
| 
 | ||||
|     DAWN_TRY(CheckHRESULT(device->GetD3D12Device()->CreateGraphicsPipelineState( | ||||
|                               &descriptorD3D12, IID_PPV_ARGS(&mPipelineState)), | ||||
|                           "D3D12 create graphics pipeline state")); | ||||
| 
 | ||||
|     if (!cacheHit) { | ||||
|         // Cache misses, need to get pipeline cached blob and store.
 | ||||
|         ComPtr<ID3DBlob> d3dBlob; | ||||
|         DAWN_TRY(CheckHRESULT(GetPipelineState()->GetCachedBlob(&d3dBlob), | ||||
|                               "D3D12 render pipeline state get cached blob")); | ||||
|         device->StoreCachedBlob(GetCacheKey(), CachedBlob::Create(std::move(d3dBlob))); | ||||
|     } | ||||
| 
 | ||||
|     SetLabelImpl(); | ||||
| 
 | ||||
|     return {}; | ||||
|  | ||||
| @ -53,6 +53,8 @@ uint64_t Buffer::QueryMaxBufferLength(id<MTLDevice> mtlDevice) { | ||||
|     if (@available(macOS 10.11, *)) { | ||||
|         return 256 * 1024 * 1024; | ||||
|     } | ||||
|     // 256Mb for other platform if any. (Need to have a return for all branches). | ||||
|     return 256 * 1024 * 1024; | ||||
| #else | ||||
|     // macOS / tvOS: 256Mb limit in versions without [MTLDevice maxBufferLength] | ||||
|     return 256 * 1024 * 1024; | ||||
|  | ||||
| @ -50,10 +50,10 @@ VkPipelineCache PipelineCache::GetHandle() const { | ||||
|     return mHandle; | ||||
| } | ||||
| 
 | ||||
| ResultOrError<CachedBlob> PipelineCache::SerializeToBlobImpl() { | ||||
|     CachedBlob emptyBlob; | ||||
| MaybeError PipelineCache::SerializeToBlobImpl(CachedBlob* blob) { | ||||
|     if (mHandle == VK_NULL_HANDLE) { | ||||
|         return emptyBlob; | ||||
|         // Pipeline cache isn't created successfully
 | ||||
|         return {}; | ||||
|     } | ||||
| 
 | ||||
|     size_t bufferSize; | ||||
| @ -61,12 +61,13 @@ ResultOrError<CachedBlob> PipelineCache::SerializeToBlobImpl() { | ||||
|     DAWN_TRY(CheckVkSuccess( | ||||
|         device->fn.GetPipelineCacheData(device->GetVkDevice(), mHandle, &bufferSize, nullptr), | ||||
|         "GetPipelineCacheData")); | ||||
| 
 | ||||
|     CachedBlob blob(bufferSize); | ||||
|     DAWN_TRY(CheckVkSuccess( | ||||
|         device->fn.GetPipelineCacheData(device->GetVkDevice(), mHandle, &bufferSize, blob.Data()), | ||||
|     if (bufferSize > 0) { | ||||
|         *blob = CachedBlob::Create(bufferSize); | ||||
|         DAWN_TRY(CheckVkSuccess(device->fn.GetPipelineCacheData(device->GetVkDevice(), mHandle, | ||||
|                                                                 &bufferSize, blob->Data()), | ||||
|                                 "GetPipelineCacheData")); | ||||
|     return blob; | ||||
|     } | ||||
|     return {}; | ||||
| } | ||||
| 
 | ||||
| void PipelineCache::Initialize() { | ||||
|  | ||||
| @ -38,7 +38,7 @@ class PipelineCache final : public PipelineCacheBase { | ||||
|     ~PipelineCache() override; | ||||
| 
 | ||||
|     void Initialize(); | ||||
|     ResultOrError<CachedBlob> SerializeToBlobImpl() override; | ||||
|     MaybeError SerializeToBlobImpl(CachedBlob* blob) override; | ||||
| 
 | ||||
|     DeviceBase* mDevice; | ||||
|     VkPipelineCache mHandle = VK_NULL_HANDLE; | ||||
|  | ||||
| @ -26,18 +26,49 @@ using ::testing::NiceMock; | ||||
| 
 | ||||
| // TODO(dawn:549) Add some sort of pipeline descriptor repository to test more caching.
 | ||||
| 
 | ||||
| static constexpr std::string_view kComputeShader = R"( | ||||
| static constexpr std::string_view kComputeShaderDefault = R"( | ||||
|         @stage(compute) @workgroup_size(1) fn main() {} | ||||
|     )"; | ||||
| 
 | ||||
| static constexpr std::string_view kVertexShader = R"( | ||||
| static constexpr std::string_view kComputeShaderMultipleEntryPoints = R"( | ||||
|         @stage(compute) @workgroup_size(16) fn main() {} | ||||
|         @stage(compute) @workgroup_size(64) fn main2() {} | ||||
|     )"; | ||||
| 
 | ||||
| static constexpr std::string_view kVertexShaderDefault = R"( | ||||
|         @stage(vertex) fn main() -> @builtin(position) vec4<f32> { | ||||
|             return vec4<f32>(0.0, 0.0, 0.0, 0.0); | ||||
|         } | ||||
|     )"; | ||||
| 
 | ||||
| static constexpr std::string_view kFragmentShader = R"( | ||||
|         @stage(fragment) fn main() {} | ||||
| static constexpr std::string_view kVertexShaderMultipleEntryPoints = R"( | ||||
|         @stage(vertex) fn main() -> @builtin(position) vec4<f32> { | ||||
|             return vec4<f32>(1.0, 0.0, 0.0, 1.0); | ||||
|         } | ||||
| 
 | ||||
|         @stage(vertex) fn main2() -> @builtin(position) vec4<f32> { | ||||
|             return vec4<f32>(0.5, 0.5, 0.5, 1.0); | ||||
|         } | ||||
|     )"; | ||||
| 
 | ||||
| static constexpr std::string_view kFragmentShaderDefault = R"( | ||||
|         @stage(fragment) fn main() -> @location(0) vec4<f32> { | ||||
|             return vec4<f32>(0.1, 0.2, 0.3, 0.4); | ||||
|         } | ||||
|     )"; | ||||
| 
 | ||||
| static constexpr std::string_view kFragmentShaderMultipleOutput = R"( | ||||
|         struct FragmentOut { | ||||
|             @location(0) fragColor0 : vec4<f32>, | ||||
|             @location(1) fragColor1 : vec4<f32>, | ||||
|         } | ||||
| 
 | ||||
|         @stage(fragment) fn main() -> FragmentOut { | ||||
|             var output : FragmentOut; | ||||
|             output.fragColor0 = vec4<f32>(0.1, 0.2, 0.3, 0.4); | ||||
|             output.fragColor1 = vec4<f32>(0.5, 0.6, 0.7, 0.8); | ||||
|             return output; | ||||
|         } | ||||
|     )"; | ||||
| 
 | ||||
| class PipelineCachingTests : public DawnTest { | ||||
| @ -62,7 +93,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineNoCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
| @ -72,7 +103,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineNoCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
| @ -82,7 +113,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineNoCache) { | ||||
| // Tests that pipeline creation on the same device uses frontend cache when possible.
 | ||||
| TEST_P(SinglePipelineCachingTests, ComputePipelineFrontedCache) { | ||||
|     wgpu::ComputePipelineDescriptor desc; | ||||
|     desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|     desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|     desc.compute.entryPoint = "main"; | ||||
| 
 | ||||
|     // First creation should create a cache entry.
 | ||||
| @ -106,7 +137,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
| @ -116,13 +147,74 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 1u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation hits the cache when using the same pipeline but with explicit
 | ||||
| // layout.
 | ||||
| TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCacheExplictLayout) { | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| 
 | ||||
|     // Cache should hit: use the same pipeline but with explicit pipeline layout.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         desc.layout = utils::MakeBasicPipelineLayout(device, {}); | ||||
|         EXPECT_CACHE_HIT(mMockCache, 1u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation wouldn't hit the cache if the pipelines are not exactly the same.
 | ||||
| TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCacheShaderNegativeCases) { | ||||
|     size_t numCacheEntries = 0u; | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: different shader module.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = | ||||
|             utils::CreateShaderModule(device, kComputeShaderMultipleEntryPoints.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: same shader module but different shader entry point.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = | ||||
|             utils::CreateShaderModule(device, kComputeShaderMultipleEntryPoints.data()); | ||||
|         desc.compute.entryPoint = "main2"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation does not hits the cache when it is enabled but we use different
 | ||||
| // isolation keys.
 | ||||
| TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCacheIsolationKey) { | ||||
| @ -130,7 +222,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCacheIsolationKey) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice("isolation key 1"); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
| @ -140,7 +232,7 @@ TEST_P(SinglePipelineCachingTests, ComputePipelineBlobCacheIsolationKey) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice("isolation key 2"); | ||||
|         wgpu::ComputePipelineDescriptor desc; | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShader.data()); | ||||
|         desc.compute.module = utils::CreateShaderModule(device, kComputeShaderDefault.data()); | ||||
|         desc.compute.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateComputePipeline(&desc)); | ||||
|     } | ||||
| @ -158,10 +250,9 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineNoCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
| @ -171,10 +262,9 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineNoCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
| @ -184,10 +274,9 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineNoCache) { | ||||
| // Tests that pipeline creation on the same device uses frontend cache when possible.
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineFrontedCache) { | ||||
|     utils::ComboRenderPipelineDescriptor desc; | ||||
|     desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|     desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|     desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|     desc.vertex.entryPoint = "main"; | ||||
|     desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|     desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|     desc.cFragment.entryPoint = "main"; | ||||
| 
 | ||||
|     // First creation should create a cache entry.
 | ||||
| @ -211,10 +300,9 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
| @ -224,16 +312,172 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCache) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 1u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation hits the cache when using the same pipeline but with explicit
 | ||||
| // layout.
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheExplictLayout) { | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| 
 | ||||
|     // Cache should hit: use the same pipeline but with explicit pipeline layout.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         desc.layout = utils::MakeBasicPipelineLayout(device, {}); | ||||
|         EXPECT_CACHE_HIT(mMockCache, 1u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation wouldn't hit the cache if the pipelines have different state set in
 | ||||
| // the descriptor.
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheDescriptorNegativeCases) { | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 1u); | ||||
| 
 | ||||
|     // Cache should not hit: different pipeline descriptor state.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.primitive.topology = wgpu::PrimitiveTopology::PointList; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 2u); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation wouldn't hit the cache if the pipelines are not exactly the same in
 | ||||
| // terms of shader.
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheShaderNegativeCases) { | ||||
|     size_t numCacheEntries = 0u; | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: different shader module.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = | ||||
|             utils::CreateShaderModule(device, kVertexShaderMultipleEntryPoints.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: same shader module but different shader entry point.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.vertex.module = | ||||
|             utils::CreateShaderModule(device, kVertexShaderMultipleEntryPoints.data()); | ||||
|         desc.vertex.entryPoint = "main2"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation wouldn't hit the cache if the pipelines are not exactly the same
 | ||||
| // (fragment color targets differences).
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheNegativeCasesFragmentColorTargets) { | ||||
|     size_t numCacheEntries = 0u; | ||||
|     // First time should create and write out to the cache.
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cFragment.targetCount = 2; | ||||
|         desc.cTargets[0].format = wgpu::TextureFormat::RGBA8Unorm; | ||||
|         desc.cTargets[1].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.cTargets[1].format = wgpu::TextureFormat::RGBA8Unorm; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = | ||||
|             utils::CreateShaderModule(device, kFragmentShaderMultipleOutput.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: different fragment color target state (sparse).
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cFragment.targetCount = 2; | ||||
|         desc.cTargets[0].format = wgpu::TextureFormat::Undefined; | ||||
|         desc.cTargets[1].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.cTargets[1].format = wgpu::TextureFormat::RGBA8Unorm; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = | ||||
|             utils::CreateShaderModule(device, kFragmentShaderMultipleOutput.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| 
 | ||||
|     // Cache should not hit: different fragment color target state (trailing empty).
 | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice(); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cFragment.targetCount = 2; | ||||
|         desc.cTargets[0].format = wgpu::TextureFormat::RGBA8Unorm; | ||||
|         desc.cTargets[1].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.cTargets[1].format = wgpu::TextureFormat::Undefined; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = | ||||
|             utils::CreateShaderModule(device, kFragmentShaderMultipleOutput.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), ++numCacheEntries); | ||||
| } | ||||
| 
 | ||||
| // Tests that pipeline creation does not hits the cache when it is enabled but we use different
 | ||||
| // isolation keys.
 | ||||
| TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheIsolationKey) { | ||||
| @ -241,10 +485,9 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheIsolationKey) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice("isolation key 1"); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
| @ -254,16 +497,17 @@ TEST_P(SinglePipelineCachingTests, RenderPipelineBlobCacheIsolationKey) { | ||||
|     { | ||||
|         wgpu::Device device = CreateDevice("isolation key 2"); | ||||
|         utils::ComboRenderPipelineDescriptor desc; | ||||
|         desc.cTargets[0].writeMask = wgpu::ColorWriteMask::None; | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShader.data()); | ||||
|         desc.vertex.module = utils::CreateShaderModule(device, kVertexShaderDefault.data()); | ||||
|         desc.vertex.entryPoint = "main"; | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShader.data()); | ||||
|         desc.cFragment.module = utils::CreateShaderModule(device, kFragmentShaderDefault.data()); | ||||
|         desc.cFragment.entryPoint = "main"; | ||||
|         EXPECT_CACHE_HIT(mMockCache, 0u, device.CreateRenderPipeline(&desc)); | ||||
|     } | ||||
|     EXPECT_EQ(mMockCache.GetNumEntries(), 2u); | ||||
| } | ||||
| 
 | ||||
| DAWN_INSTANTIATE_TEST(SinglePipelineCachingTests, VulkanBackend({"enable_blob_cache"})); | ||||
| DAWN_INSTANTIATE_TEST(SinglePipelineCachingTests, | ||||
|                       VulkanBackend({"enable_blob_cache"}), | ||||
|                       D3D12Backend({"enable_blob_cache"})); | ||||
| 
 | ||||
| }  // namespace
 | ||||
|  | ||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user