#include "../win/Win32Common.hpp" #include "logvisor/logvisor.hpp" #include "boo/graphicsdev/D3D.hpp" #include "boo/IGraphicsContext.hpp" #include "Common.hpp" #include #include #include #include #include #include #include #include #include #include "xxhash.h" #undef min #undef max extern pD3DCompile D3DCompilePROC; static const char* GammaVS = "struct VertData\n" "{\n" " float4 posIn : POSITION;\n" " float4 uvIn : UV;\n" "};\n" "\n" "struct VertToFrag\n" "{\n" " float4 pos : SV_Position;\n" " float2 uv : UV;\n" "};\n" "\n" "VertToFrag main(in VertData v)\n" "{\n" " VertToFrag vtf;\n" " vtf.uv = v.uvIn.xy;\n" " vtf.pos = v.posIn;\n" " return vtf;\n" "}\n"; static const char* GammaFS = "struct VertToFrag\n" "{\n" " float4 pos : SV_Position;\n" " float2 uv : UV;\n" "};\n" "\n" "Texture2D screenTex : register(t0);\n" "Texture2D gammaLUT : register(t1);\n" "SamplerState samp : register(s2);\n" "float4 main(in VertToFrag vtf) : SV_Target0\n" "{\n" " int4 tex = int4(saturate(screenTex.Sample(samp, vtf.uv)) * float4(65535.0, 65535.0, 65535.0, 65535.0));\n" " float4 colorOut;\n" " for (int i=0 ; i<3 ; ++i)\n" " colorOut[i] = gammaLUT.Load(int3(tex[i] % 256, tex[i] / 256, 0)).r;\n" " return colorOut;\n" "}\n"; namespace boo { static logvisor::Module Log("boo::D3D11"); class D3D11DataFactory; struct D3D11ShareableShader : IShareableShader { ComPtr m_shader; ComPtr m_vtxBlob; D3D11ShareableShader(D3D11DataFactory& fac, uint64_t srcKey, uint64_t binKey, ComPtr&& s, ComPtr&& vb) : IShareableShader(fac, srcKey, binKey), m_shader(std::move(s)), m_vtxBlob(std::move(vb)) {} D3D11ShareableShader(D3D11DataFactory& fac, uint64_t srcKey, uint64_t binKey, ComPtr&& s) : IShareableShader(fac, srcKey, binKey), m_shader(std::move(s)) {} }; static inline void ThrowIfFailed(HRESULT hr) { if (FAILED(hr)) { // Set a breakpoint on this line to catch Win32 API errors. #if !WINDOWS_STORE _com_error err(hr); #else _com_error err(hr, L"D3D11 fail"); #endif LPCTSTR errMsg = err.ErrorMessage(); Log.report(logvisor::Fatal, errMsg); } } static const D3D11_BIND_FLAG USE_TABLE[] = { D3D11_BIND_VERTEX_BUFFER, D3D11_BIND_VERTEX_BUFFER, D3D11_BIND_INDEX_BUFFER, D3D11_BIND_CONSTANT_BUFFER }; class D3D11GraphicsBufferS : public GraphicsDataNode { friend class D3D11DataFactory; friend struct D3D11CommandQueue; size_t m_sz; D3D11GraphicsBufferS(const boo::ObjToken& parent, BufferUse use, D3D11Context* ctx, const void* data, size_t stride, size_t count) : GraphicsDataNode(parent), m_sz(stride * count), m_stride(stride), m_count(count) { D3D11_SUBRESOURCE_DATA iData = {data}; CD3D11_BUFFER_DESC desc(m_sz, USE_TABLE[int(use)], D3D11_USAGE_IMMUTABLE); ThrowIfFailed(ctx->m_dev->CreateBuffer(&desc, &iData, &m_buf)); } public: size_t m_stride; size_t m_count; ComPtr m_buf; ~D3D11GraphicsBufferS() = default; }; template class D3D11GraphicsBufferD : public GraphicsDataNode { friend class D3D11DataFactory; friend struct D3D11CommandQueue; D3D11CommandQueue* m_q; std::unique_ptr m_cpuBuf; size_t m_cpuSz; int m_validSlots = 0; D3D11GraphicsBufferD(const boo::ObjToken& parent, D3D11CommandQueue* q, BufferUse use, D3D11Context* ctx, size_t stride, size_t count) : GraphicsDataNode(parent), m_q(q), m_stride(stride), m_count(count) { m_cpuSz = stride * count; m_cpuBuf.reset(new uint8_t[m_cpuSz]); for (int i=0 ; i<3 ; ++i) { CD3D11_BUFFER_DESC desc(m_cpuSz, USE_TABLE[int(use)], D3D11_USAGE_DYNAMIC, D3D11_CPU_ACCESS_WRITE); ThrowIfFailed(ctx->m_dev->CreateBuffer(&desc, nullptr, &m_bufs[i])); } } void update(ID3D11DeviceContext* ctx, int b); public: size_t m_stride; size_t m_count; ComPtr m_bufs[3]; ~D3D11GraphicsBufferD() = default; void load(const void* data, size_t sz); void* map(size_t sz); void unmap(); }; class D3D11TextureS : public GraphicsDataNode { friend class D3D11DataFactory; D3D11TextureS(const boo::ObjToken& parent, D3D11Context* ctx, size_t width, size_t height, size_t mips, TextureFormat fmt, const void* data, size_t sz) : GraphicsDataNode(parent) { DXGI_FORMAT pfmt = DXGI_FORMAT_UNKNOWN; int pxPitchNum = 1; int pxPitchDenom = 1; bool compressed = false; switch (fmt) { case TextureFormat::RGBA8: pfmt = DXGI_FORMAT_R8G8B8A8_UNORM; pxPitchNum = 4; break; case TextureFormat::I8: pfmt = DXGI_FORMAT_R8_UNORM; break; case TextureFormat::I16: pfmt = DXGI_FORMAT_R16_UNORM; pxPitchNum = 2; break; case TextureFormat::DXT1: pfmt = DXGI_FORMAT_BC1_UNORM; compressed = true; pxPitchNum = 1; pxPitchDenom = 2; break; default: Log.report(logvisor::Fatal, "unsupported tex format"); } CD3D11_TEXTURE2D_DESC desc(pfmt, width, height, 1, mips, D3D11_BIND_SHADER_RESOURCE, D3D11_USAGE_IMMUTABLE); const uint8_t* dataIt = static_cast(data); D3D11_SUBRESOURCE_DATA upData[16] = {}; for (size_t i=0 ; i 1) width /= 2; if (height > 1) height /= 2; } ThrowIfFailed(ctx->m_dev->CreateTexture2D(&desc, upData, &m_tex)); CD3D11_SHADER_RESOURCE_VIEW_DESC srvDesc(m_tex.Get(), D3D_SRV_DIMENSION_TEXTURE2D, pfmt, 0, mips); ThrowIfFailed(ctx->m_dev->CreateShaderResourceView(m_tex.Get(), &srvDesc, &m_srv)); } public: ComPtr m_tex; ComPtr m_srv; ~D3D11TextureS() = default; }; class D3D11TextureSA : public GraphicsDataNode { friend class D3D11DataFactory; D3D11TextureSA(const boo::ObjToken& parent, D3D11Context* ctx, size_t width, size_t height, size_t layers, size_t mips, TextureFormat fmt, const void* data, size_t sz) : GraphicsDataNode(parent) { size_t pixelPitch = 0; DXGI_FORMAT pixelFmt = DXGI_FORMAT_UNKNOWN; switch (fmt) { case TextureFormat::RGBA8: pixelPitch = 4; pixelFmt = DXGI_FORMAT_R8G8B8A8_UNORM; break; case TextureFormat::I8: pixelPitch = 1; pixelFmt = DXGI_FORMAT_R8_UNORM; break; case TextureFormat::I16: pixelPitch = 2; pixelFmt = DXGI_FORMAT_R16_UNORM; break; default: Log.report(logvisor::Fatal, "unsupported tex format"); } CD3D11_TEXTURE2D_DESC desc(pixelFmt, width, height, layers, mips, D3D11_BIND_SHADER_RESOURCE, D3D11_USAGE_IMMUTABLE); const uint8_t* dataIt = static_cast(data); std::unique_ptr upData(new D3D11_SUBRESOURCE_DATA[layers * mips]); D3D11_SUBRESOURCE_DATA* outIt = upData.get(); for (size_t i=0 ; ipSysMem = dataIt; outIt->SysMemPitch = width * pixelPitch; outIt->SysMemSlicePitch = outIt->SysMemPitch * height; dataIt += outIt->SysMemSlicePitch; ++outIt; } if (width > 1) width /= 2; if (height > 1) height /= 2; } ThrowIfFailed(ctx->m_dev->CreateTexture2D(&desc, upData.get(), &m_tex)); CD3D11_SHADER_RESOURCE_VIEW_DESC srvDesc(m_tex.Get(), D3D_SRV_DIMENSION_TEXTURE2DARRAY, pixelFmt); ThrowIfFailed(ctx->m_dev->CreateShaderResourceView(m_tex.Get(), &srvDesc, &m_srv)); } public: ComPtr m_tex; ComPtr m_srv; ~D3D11TextureSA() = default; }; class D3D11TextureD : public GraphicsDataNode { friend class D3D11DataFactory; friend struct D3D11CommandQueue; size_t m_width = 0; D3D11CommandQueue* m_q; std::unique_ptr m_cpuBuf; size_t m_cpuSz; size_t m_pxPitch; int m_validSlots = 0; D3D11TextureD(const boo::ObjToken& parent, D3D11CommandQueue* q, D3D11Context* ctx, size_t width, size_t height, TextureFormat fmt) : GraphicsDataNode(parent), m_width(width), m_q(q) { DXGI_FORMAT pixelFmt = DXGI_FORMAT_UNKNOWN; switch (fmt) { case TextureFormat::RGBA8: pixelFmt = DXGI_FORMAT_R8G8B8A8_UNORM; m_pxPitch = 4; break; case TextureFormat::I8: pixelFmt = DXGI_FORMAT_R8_UNORM; m_pxPitch = 1; break; case TextureFormat::I16: pixelFmt = DXGI_FORMAT_R16_UNORM; m_pxPitch = 2; break; default: Log.report(logvisor::Fatal, "unsupported tex format"); } m_cpuSz = width * height * m_pxPitch; m_cpuBuf.reset(new uint8_t[m_cpuSz]); CD3D11_TEXTURE2D_DESC desc(pixelFmt, width, height, 1, 1, D3D11_BIND_SHADER_RESOURCE, D3D11_USAGE_DYNAMIC, D3D11_CPU_ACCESS_WRITE); for (int i=0 ; i<3 ; ++i) { ThrowIfFailed(ctx->m_dev->CreateTexture2D(&desc, nullptr, &m_texs[i])); CD3D11_SHADER_RESOURCE_VIEW_DESC srvDesc(m_texs[i].Get(), D3D_SRV_DIMENSION_TEXTURE2D, pixelFmt); ThrowIfFailed(ctx->m_dev->CreateShaderResourceView(m_texs[i].Get(), &srvDesc, &m_srvs[i])); } } void update(ID3D11DeviceContext* ctx, int b); public: ComPtr m_texs[3]; ComPtr m_srvs[3]; ~D3D11TextureD() = default; void load(const void* data, size_t sz); void* map(size_t sz); void unmap(); }; #define MAX_BIND_TEXS 4 class D3D11TextureR : public GraphicsDataNode { friend class D3D11DataFactory; friend struct D3D11CommandQueue; size_t m_width = 0; size_t m_height = 0; size_t m_samples = 0; size_t m_colorBindCount; size_t m_depthBindCount; void Setup(D3D11Context* ctx) { CD3D11_TEXTURE2D_DESC colorDesc(ctx->m_fbFormat, m_width, m_height, 1, 1, D3D11_BIND_RENDER_TARGET, D3D11_USAGE_DEFAULT, 0, m_samples); ThrowIfFailed(ctx->m_dev->CreateTexture2D(&colorDesc, nullptr, &m_colorTex)); CD3D11_TEXTURE2D_DESC depthDesc(DXGI_FORMAT_D32_FLOAT, m_width, m_height, 1, 1, D3D11_BIND_DEPTH_STENCIL, D3D11_USAGE_DEFAULT, 0, m_samples); ThrowIfFailed(ctx->m_dev->CreateTexture2D(&depthDesc, nullptr, &m_depthTex)); D3D11_RTV_DIMENSION rtvDim; D3D11_DSV_DIMENSION dsvDim; if (m_samples > 1) { rtvDim = D3D11_RTV_DIMENSION_TEXTURE2DMS; dsvDim = D3D11_DSV_DIMENSION_TEXTURE2DMS; } else { rtvDim = D3D11_RTV_DIMENSION_TEXTURE2D; dsvDim = D3D11_DSV_DIMENSION_TEXTURE2D; } CD3D11_RENDER_TARGET_VIEW_DESC rtvDesc(m_colorTex.Get(), rtvDim); ThrowIfFailed(ctx->m_dev->CreateRenderTargetView(m_colorTex.Get(), &rtvDesc, &m_rtv)); CD3D11_DEPTH_STENCIL_VIEW_DESC dsvDesc(m_depthTex.Get(), dsvDim); ThrowIfFailed(ctx->m_dev->CreateDepthStencilView(m_depthTex.Get(), &dsvDesc, &m_dsv)); for (size_t i=0 ; im_fbFormat, m_width, m_height, 1, 1, D3D11_BIND_SHADER_RESOURCE, D3D11_USAGE_DEFAULT, 0, 1); ThrowIfFailed(ctx->m_dev->CreateTexture2D(&colorBindDesc, nullptr, &m_colorBindTex[i])); CD3D11_SHADER_RESOURCE_VIEW_DESC colorSrvDesc(m_colorBindTex[i].Get(), D3D11_SRV_DIMENSION_TEXTURE2D); ThrowIfFailed(ctx->m_dev->CreateShaderResourceView(m_colorBindTex[i].Get(), &colorSrvDesc, &m_colorSrv[i])); } for (size_t i=0 ; im_dev->CreateTexture2D(&depthBindDesc, nullptr, &m_depthBindTex[i])); CD3D11_SHADER_RESOURCE_VIEW_DESC depthSrvDesc(m_depthBindTex[i].Get(), D3D11_SRV_DIMENSION_TEXTURE2D, DXGI_FORMAT_R32_FLOAT); ThrowIfFailed(ctx->m_dev->CreateShaderResourceView(m_depthBindTex[i].Get(), &depthSrvDesc, &m_depthSrv[i])); } } D3D11TextureR(const boo::ObjToken& parent, D3D11Context* ctx, size_t width, size_t height, size_t samples, size_t colorBindCount, size_t depthBindCount) : GraphicsDataNode(parent), m_width(width), m_height(height), m_samples(samples), m_colorBindCount(colorBindCount), m_depthBindCount(depthBindCount) { if (colorBindCount > MAX_BIND_TEXS) Log.report(logvisor::Fatal, "too many color bindings for render texture"); if (depthBindCount > MAX_BIND_TEXS) Log.report(logvisor::Fatal, "too many depth bindings for render texture"); if (samples == 0) m_samples = 1; Setup(ctx); } public: size_t samples() const {return m_samples;} ComPtr m_colorTex; ComPtr m_rtv; ComPtr m_depthTex; ComPtr m_dsv; ComPtr m_colorBindTex[MAX_BIND_TEXS]; ComPtr m_colorSrv[MAX_BIND_TEXS]; ComPtr m_depthBindTex[MAX_BIND_TEXS]; ComPtr m_depthSrv[MAX_BIND_TEXS]; ~D3D11TextureR() = default; void resize(D3D11Context* ctx, size_t width, size_t height) { if (width < 1) width = 1; if (height < 1) height = 1; m_width = width; m_height = height; Setup(ctx); } }; static const size_t SEMANTIC_SIZE_TABLE[] = { 0, 12, 16, 12, 16, 16, 4, 8, 16, 16, 16 }; static const char* SEMANTIC_NAME_TABLE[] = { nullptr, "POSITION", "POSITION", "NORMAL", "NORMAL", "COLOR", "COLOR", "UV", "UV", "WEIGHT", "MODELVIEW" }; static const DXGI_FORMAT SEMANTIC_TYPE_TABLE[] = { DXGI_FORMAT_UNKNOWN, DXGI_FORMAT_R32G32B32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT, DXGI_FORMAT_R32G32B32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT, DXGI_FORMAT_R8G8B8A8_UNORM, DXGI_FORMAT_R32G32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT, DXGI_FORMAT_R32G32B32A32_FLOAT }; struct D3D11VertexFormat : GraphicsDataNode { size_t m_elementCount; std::unique_ptr m_elements; size_t m_stride = 0; size_t m_instStride = 0; D3D11VertexFormat(const boo::ObjToken& parent, size_t elementCount, const VertexElementDescriptor* elements) : GraphicsDataNode(parent), m_elementCount(elementCount), m_elements(new D3D11_INPUT_ELEMENT_DESC[elementCount]) { memset(m_elements.get(), 0, elementCount * sizeof(D3D11_INPUT_ELEMENT_DESC)); for (size_t i=0 ; isemantic & boo::VertexSemantic::SemanticMask); elem.SemanticName = SEMANTIC_NAME_TABLE[semantic]; elem.SemanticIndex = elemin->semanticIdx; elem.Format = SEMANTIC_TYPE_TABLE[semantic]; if ((elemin->semantic & boo::VertexSemantic::Instanced) != boo::VertexSemantic::None) { elem.InputSlotClass = D3D11_INPUT_PER_INSTANCE_DATA; elem.InstanceDataStepRate = 1; elem.InputSlot = 1; elem.AlignedByteOffset = m_instStride; m_instStride += SEMANTIC_SIZE_TABLE[semantic]; } else { elem.InputSlotClass = D3D11_INPUT_PER_VERTEX_DATA; elem.AlignedByteOffset = m_stride; m_stride += SEMANTIC_SIZE_TABLE[semantic]; } } } }; static const D3D11_PRIMITIVE_TOPOLOGY PRIMITIVE_TABLE[] = { D3D10_PRIMITIVE_TOPOLOGY_TRIANGLELIST, D3D10_PRIMITIVE_TOPOLOGY_TRIANGLESTRIP }; static const D3D11_BLEND BLEND_FACTOR_TABLE[] = { D3D11_BLEND_ZERO, D3D11_BLEND_ONE, D3D11_BLEND_SRC_COLOR, D3D11_BLEND_INV_SRC_COLOR, D3D11_BLEND_DEST_COLOR, D3D11_BLEND_INV_DEST_COLOR, D3D11_BLEND_SRC_ALPHA, D3D11_BLEND_INV_SRC_ALPHA, D3D11_BLEND_DEST_ALPHA, D3D11_BLEND_INV_DEST_ALPHA, D3D11_BLEND_SRC1_COLOR, D3D11_BLEND_INV_SRC1_COLOR }; class D3D11ShaderPipeline : public GraphicsDataNode { friend class D3D11DataFactory; friend struct D3D11ShaderDataBinding; boo::ObjToken m_vtxFmt; D3D11ShareableShader::Token m_vert; D3D11ShareableShader::Token m_pixel; D3D11ShaderPipeline(const boo::ObjToken& parent, D3D11Context* ctx, D3D11ShareableShader::Token&& vert, D3D11ShareableShader::Token&& pixel, const boo::ObjToken& vtxFmt, BlendFactor srcFac, BlendFactor dstFac, Primitive prim, ZTest depthTest, bool depthWrite, bool colorWrite, bool alphaWrite, bool overwriteAlpha, CullMode culling) : GraphicsDataNode(parent), m_vtxFmt(vtxFmt), m_vert(std::move(vert)), m_pixel(std::move(pixel)), m_topology(PRIMITIVE_TABLE[int(prim)]) { m_vert.get().m_shader.As(&m_vShader); m_pixel.get().m_shader.As(&m_pShader); D3D11_CULL_MODE cullMode; switch (culling) { case CullMode::None: default: cullMode = D3D11_CULL_NONE; break; case CullMode::Backface: cullMode = D3D11_CULL_BACK; break; case CullMode::Frontface: cullMode = D3D11_CULL_FRONT; break; } CD3D11_RASTERIZER_DESC rasDesc(D3D11_FILL_SOLID, cullMode, true, D3D11_DEFAULT_DEPTH_BIAS, D3D11_DEFAULT_DEPTH_BIAS_CLAMP, D3D11_DEFAULT_SLOPE_SCALED_DEPTH_BIAS, true, true, false, false); ThrowIfFailed(ctx->m_dev->CreateRasterizerState(&rasDesc, &m_rasState)); CD3D11_DEPTH_STENCIL_DESC dsDesc(D3D11_DEFAULT); dsDesc.DepthEnable = depthTest != ZTest::None; dsDesc.DepthWriteMask = D3D11_DEPTH_WRITE_MASK(depthWrite); switch (depthTest) { case ZTest::None: default: dsDesc.DepthFunc = D3D11_COMPARISON_ALWAYS; break; case ZTest::LEqual: dsDesc.DepthFunc = D3D11_COMPARISON_GREATER_EQUAL; break; case ZTest::Greater: dsDesc.DepthFunc = D3D11_COMPARISON_LESS; break; case ZTest::GEqual: dsDesc.DepthFunc = D3D11_COMPARISON_LESS_EQUAL; break; case ZTest::Equal: dsDesc.DepthFunc = D3D11_COMPARISON_EQUAL; break; } ThrowIfFailed(ctx->m_dev->CreateDepthStencilState(&dsDesc, &m_dsState)); CD3D11_BLEND_DESC blDesc(D3D11_DEFAULT); blDesc.RenderTarget[0].BlendEnable = (dstFac != BlendFactor::Zero); if (srcFac == BlendFactor::Subtract || dstFac == BlendFactor::Subtract) { blDesc.RenderTarget[0].SrcBlend = D3D11_BLEND_SRC_ALPHA; blDesc.RenderTarget[0].DestBlend = D3D11_BLEND_ONE; blDesc.RenderTarget[0].BlendOp = D3D11_BLEND_OP_REV_SUBTRACT; if (overwriteAlpha) { blDesc.RenderTarget[0].SrcBlendAlpha = D3D11_BLEND_ONE; blDesc.RenderTarget[0].DestBlendAlpha = D3D11_BLEND_ZERO; blDesc.RenderTarget[0].BlendOpAlpha = D3D11_BLEND_OP_ADD; } else { blDesc.RenderTarget[0].SrcBlendAlpha = D3D11_BLEND_SRC_ALPHA; blDesc.RenderTarget[0].DestBlendAlpha = D3D11_BLEND_ONE; blDesc.RenderTarget[0].BlendOpAlpha = D3D11_BLEND_OP_REV_SUBTRACT; } } else { blDesc.RenderTarget[0].SrcBlend = BLEND_FACTOR_TABLE[int(srcFac)]; blDesc.RenderTarget[0].DestBlend = BLEND_FACTOR_TABLE[int(dstFac)]; blDesc.RenderTarget[0].BlendOp = D3D11_BLEND_OP_ADD; if (overwriteAlpha) { blDesc.RenderTarget[0].SrcBlendAlpha = D3D11_BLEND_ONE; blDesc.RenderTarget[0].DestBlendAlpha = D3D11_BLEND_ZERO; } else { blDesc.RenderTarget[0].SrcBlendAlpha = BLEND_FACTOR_TABLE[int(srcFac)]; blDesc.RenderTarget[0].DestBlendAlpha = BLEND_FACTOR_TABLE[int(dstFac)]; } blDesc.RenderTarget[0].BlendOpAlpha = D3D11_BLEND_OP_ADD; } blDesc.RenderTarget[0].RenderTargetWriteMask = (colorWrite ? (D3D11_COLOR_WRITE_ENABLE_RED | D3D11_COLOR_WRITE_ENABLE_GREEN | D3D11_COLOR_WRITE_ENABLE_BLUE) : 0) | (alphaWrite ? D3D11_COLOR_WRITE_ENABLE_ALPHA : 0); ThrowIfFailed(ctx->m_dev->CreateBlendState(&blDesc, &m_blState)); const auto& vertBuf = m_vert.get().m_vtxBlob; D3D11VertexFormat* cvtxFmt = vtxFmt.cast(); ThrowIfFailed(ctx->m_dev->CreateInputLayout(cvtxFmt->m_elements.get(), cvtxFmt->m_elementCount, vertBuf->GetBufferPointer(), vertBuf->GetBufferSize(), &m_inLayout)); } public: ComPtr m_vShader; ComPtr m_pShader; ComPtr m_rasState; ComPtr m_dsState; ComPtr m_blState; ComPtr m_inLayout; D3D11_PRIMITIVE_TOPOLOGY m_topology; ~D3D11ShaderPipeline() = default; D3D11ShaderPipeline& operator=(const D3D11ShaderPipeline&) = delete; D3D11ShaderPipeline(const D3D11ShaderPipeline&) = delete; void bind(ID3D11DeviceContext* ctx) { ctx->VSSetShader(m_vShader.Get(), nullptr, 0); ctx->PSSetShader(m_pShader.Get(), nullptr, 0); ctx->RSSetState(m_rasState.Get()); ctx->OMSetDepthStencilState(m_dsState.Get(), 0); ctx->OMSetBlendState(m_blState.Get(), nullptr, 0xffffffff); ctx->IASetInputLayout(m_inLayout.Get()); ctx->IASetPrimitiveTopology(m_topology); } }; struct D3D11ShaderDataBinding : public GraphicsDataNode { boo::ObjToken m_pipeline; boo::ObjToken m_vbuf; boo::ObjToken m_instVbuf; boo::ObjToken m_ibuf; std::vector> m_ubufs; std::unique_ptr m_ubufFirstConsts; std::unique_ptr m_ubufNumConsts; std::unique_ptr m_pubufs; struct BoundTex { boo::ObjToken tex; int idx; bool depth; }; std::vector m_texs; UINT m_baseOffsets[2]; D3D11ShaderDataBinding(const boo::ObjToken& d, D3D11Context* ctx, const boo::ObjToken& pipeline, const boo::ObjToken& vbuf, const boo::ObjToken& instVbuf, const boo::ObjToken& ibuf, size_t ubufCount, const boo::ObjToken* ubufs, const PipelineStage* ubufStages, const size_t* ubufOffs, const size_t* ubufSizes, size_t texCount, const boo::ObjToken* texs, const int* texBindIdx, const bool* depthBind, size_t baseVert, size_t baseInst) : GraphicsDataNode(d), m_pipeline(pipeline), m_vbuf(vbuf), m_instVbuf(instVbuf), m_ibuf(ibuf) { m_ubufs.reserve(ubufCount); m_texs.reserve(texCount); D3D11ShaderPipeline* cpipeline = m_pipeline.cast(); D3D11VertexFormat* vtxFmt = cpipeline->m_vtxFmt.cast(); m_baseOffsets[0] = UINT(baseVert * vtxFmt->m_stride); m_baseOffsets[1] = UINT(baseInst * vtxFmt->m_instStride); if (ubufStages) { m_pubufs.reset(new bool[ubufCount]); for (size_t i=0 ; i()->bind(ctx); ID3D11Buffer* bufs[2] = {}; UINT strides[2] = {}; if (m_vbuf) { if (m_vbuf->dynamic()) { D3D11GraphicsBufferD* cbuf = m_vbuf.cast>(); bufs[0] = cbuf->m_bufs[b].Get(); strides[0] = UINT(cbuf->m_stride); } else { D3D11GraphicsBufferS* cbuf = m_vbuf.cast(); bufs[0] = cbuf->m_buf.Get(); strides[0] = UINT(cbuf->m_stride); } } if (m_instVbuf) { if (m_instVbuf->dynamic()) { D3D11GraphicsBufferD* cbuf = m_instVbuf.cast>(); bufs[1] = cbuf->m_bufs[b].Get(); strides[1] = UINT(cbuf->m_stride); } else { D3D11GraphicsBufferS* cbuf = m_instVbuf.cast(); bufs[1] = cbuf->m_buf.Get(); strides[1] = UINT(cbuf->m_stride); } } ctx->IASetVertexBuffers(0, 2, bufs, strides, m_baseOffsets); if (m_ibuf) { if (m_ibuf->dynamic()) { D3D11GraphicsBufferD* cbuf = m_ibuf.cast>(); ctx->IASetIndexBuffer(cbuf->m_bufs[b].Get(), DXGI_FORMAT_R32_UINT, 0); } else { D3D11GraphicsBufferS* cbuf = m_ibuf.cast(); ctx->IASetIndexBuffer(cbuf->m_buf.Get(), DXGI_FORMAT_R32_UINT, 0); } } if (m_ubufs.size()) { if (m_ubufFirstConsts) { ID3D11Buffer* constBufs[8] = {}; ctx->VSSetConstantBuffers(0, m_ubufs.size(), constBufs); for (int i=0 ; i<8 && idynamic()) { D3D11GraphicsBufferD* cbuf = m_ubufs[i].cast>(); constBufs[i] = cbuf->m_bufs[b].Get(); } else { D3D11GraphicsBufferS* cbuf = m_ubufs[i].cast(); constBufs[i] = cbuf->m_buf.Get(); } } ctx->VSSetConstantBuffers1(0, m_ubufs.size(), constBufs, m_ubufFirstConsts.get(), m_ubufNumConsts.get()); if (m_pubufs) { ID3D11Buffer* constBufs[8] = {}; ctx->PSSetConstantBuffers(0, m_ubufs.size(), constBufs); for (int i=0 ; i<8 && idynamic()) { D3D11GraphicsBufferD* cbuf = m_ubufs[i].cast>(); constBufs[i] = cbuf->m_bufs[b].Get(); } else { D3D11GraphicsBufferS* cbuf = m_ubufs[i].cast(); constBufs[i] = cbuf->m_buf.Get(); } } ctx->PSSetConstantBuffers1(0, m_ubufs.size(), constBufs, m_ubufFirstConsts.get(), m_ubufNumConsts.get()); } } else { ID3D11Buffer* constBufs[8] = {}; for (int i=0 ; i<8 && idynamic()) { D3D11GraphicsBufferD* cbuf = m_ubufs[i].cast>(); constBufs[i] = cbuf->m_bufs[b].Get(); } else { D3D11GraphicsBufferS* cbuf = m_ubufs[i].cast(); constBufs[i] = cbuf->m_buf.Get(); } } ctx->VSSetConstantBuffers(0, m_ubufs.size(), constBufs); if (m_pubufs) { ID3D11Buffer* constBufs[8] = {}; for (int i=0 ; i<8 && idynamic()) { D3D11GraphicsBufferD* cbuf = m_ubufs[i].cast>(); constBufs[i] = cbuf->m_bufs[b].Get(); } else { D3D11GraphicsBufferS* cbuf = m_ubufs[i].cast(); constBufs[i] = cbuf->m_buf.Get(); } } ctx->PSSetConstantBuffers(0, m_ubufs.size(), constBufs); } } } if (m_texs.size()) { ID3D11ShaderResourceView* srvs[8] = {}; for (int i=0 ; i<8 && itype()) { case TextureType::Dynamic: { D3D11TextureD* ctex = m_texs[i].tex.cast(); srvs[i] = ctex->m_srvs[b].Get(); break; } case TextureType::Static: { D3D11TextureS* ctex = m_texs[i].tex.cast(); srvs[i] = ctex->m_srv.Get(); break; } case TextureType::StaticArray: { D3D11TextureSA* ctex = m_texs[i].tex.cast(); srvs[i] = ctex->m_srv.Get(); break; } case TextureType::Render: { D3D11TextureR* ctex = m_texs[i].tex.cast(); srvs[i] = m_texs[i].depth ? ctex->m_depthSrv[m_texs[i].idx].Get() : ctex->m_colorSrv[m_texs[i].idx].Get(); break; } } } } ctx->PSSetShaderResources(0, m_texs.size(), srvs); } } }; struct D3D11CommandQueue : IGraphicsCommandQueue { Platform platform() const {return IGraphicsDataFactory::Platform::D3D11;} const SystemChar* platformName() const {return _S("D3D11");} D3D11Context* m_ctx; D3D11Context::Window* m_windowCtx; IGraphicsContext* m_parent; ComPtr m_deferredCtx; size_t m_fillBuf = 0; size_t m_completeBuf = 0; size_t m_drawBuf = 0; bool m_running = true; std::mutex m_mt; std::condition_variable m_cv; std::mutex m_initmt; std::condition_variable m_initcv; std::unique_lock m_initlk; std::thread m_thr; struct CommandList { ComPtr list; std::vector> resTokens; boo::ObjToken workDoPresent; void reset() { list.Reset(); resTokens.clear(); workDoPresent.reset(); } }; CommandList m_cmdLists[3]; std::recursive_mutex m_dynamicLock; void ProcessDynamicLoads(ID3D11DeviceContext* ctx); static void RenderingWorker(D3D11CommandQueue* self); D3D11CommandQueue(D3D11Context* ctx, D3D11Context::Window* windowCtx, IGraphicsContext* parent) : m_ctx(ctx), m_windowCtx(windowCtx), m_parent(parent), m_initlk(m_initmt), m_thr(RenderingWorker, this) { m_initcv.wait(m_initlk); m_initlk.unlock(); ThrowIfFailed(ctx->m_dev->CreateDeferredContext1(0, &m_deferredCtx)); } void startRenderer(); void stopRenderer() { m_running = false; m_cv.notify_one(); m_thr.join(); } ~D3D11CommandQueue() { if (m_running) stopRenderer(); } void setShaderDataBinding(const boo::ObjToken& binding) { D3D11ShaderDataBinding* cbind = binding.cast(); cbind->bind(m_deferredCtx.Get(), m_fillBuf); m_cmdLists[m_fillBuf].resTokens.push_back(binding.get()); ID3D11SamplerState* samp[] = {m_ctx->m_ss[0].Get(), m_ctx->m_ss[1].Get(), m_ctx->m_ss[2].Get(), m_ctx->m_ss[3].Get()}; m_deferredCtx->PSSetSamplers(0, 4, samp); } boo::ObjToken m_boundTarget; void setRenderTarget(const boo::ObjToken& target) { D3D11TextureR* ctarget = target.cast(); ID3D11RenderTargetView* view[] = {ctarget->m_rtv.Get()}; m_deferredCtx->OMSetRenderTargets(1, view, ctarget->m_dsv.Get()); m_boundTarget = target; } void setViewport(const SWindowRect& rect, float znear, float zfar) { if (m_boundTarget) { D3D11TextureR* ctarget = m_boundTarget.cast(); int boundHeight = ctarget->m_height; D3D11_VIEWPORT vp = {FLOAT(rect.location[0]), FLOAT(boundHeight - rect.location[1] - rect.size[1]), FLOAT(rect.size[0]), FLOAT(rect.size[1]), 1.f - zfar, 1.f - znear}; m_deferredCtx->RSSetViewports(1, &vp); } } void setScissor(const SWindowRect& rect) { if (m_boundTarget) { D3D11TextureR* ctarget = m_boundTarget.cast(); int boundHeight = ctarget->m_height; D3D11_RECT d3drect = {LONG(rect.location[0]), LONG(boundHeight - rect.location[1] - rect.size[1]), LONG(rect.location[0] + rect.size[0]), LONG(boundHeight - rect.location[1])}; m_deferredCtx->RSSetScissorRects(1, &d3drect); } } std::unordered_map> m_texResizes; void resizeRenderTexture(const boo::ObjToken& tex, size_t width, size_t height) { D3D11TextureR* ctex = tex.cast(); std::unique_lock lk(m_mt); m_texResizes[ctex] = std::make_pair(width, height); } void schedulePostFrameHandler(std::function&& func) { func(); } float m_clearColor[4] = {0.0,0.0,0.0,0.0}; void setClearColor(const float rgba[4]) { m_clearColor[0] = rgba[0]; m_clearColor[1] = rgba[1]; m_clearColor[2] = rgba[2]; m_clearColor[3] = rgba[3]; } void clearTarget(bool render=true, bool depth=true) { if (!m_boundTarget) return; D3D11TextureR* ctarget = m_boundTarget.cast(); if (render) m_deferredCtx->ClearRenderTargetView(ctarget->m_rtv.Get(), m_clearColor); if (depth) m_deferredCtx->ClearDepthStencilView(ctarget->m_dsv.Get(), D3D11_CLEAR_DEPTH, 0.0f, 0); } void draw(size_t start, size_t count) { m_deferredCtx->Draw(count, start); } void drawIndexed(size_t start, size_t count) { m_deferredCtx->DrawIndexed(count, start, 0); } void drawInstances(size_t start, size_t count, size_t instCount) { m_deferredCtx->DrawInstanced(count, instCount, start, 0); } void drawInstancesIndexed(size_t start, size_t count, size_t instCount) { m_deferredCtx->DrawIndexedInstanced(count, instCount, start, 0, 0); } void _resolveBindTexture(ID3D11DeviceContext1* ctx, const D3D11TextureR* tex, const SWindowRect& rect, bool tlOrigin, int bindIdx, bool color, bool depth) { if (color && tex->m_colorBindCount) { if (tex->m_samples > 1) { ctx->ResolveSubresource(tex->m_colorBindTex[bindIdx].Get(), 0, tex->m_colorTex.Get(), 0, m_ctx->m_fbFormat); } else { SWindowRect intersectRect = rect.intersect(SWindowRect(0, 0, tex->m_width, tex->m_height)); int y = tlOrigin ? intersectRect.location[1] : (tex->m_height - intersectRect.size[1] - intersectRect.location[1]); D3D11_BOX box = {UINT(intersectRect.location[0]), UINT(y), 0, UINT(intersectRect.location[0] + intersectRect.size[0]), UINT(y + intersectRect.size[1]), 1}; ctx->CopySubresourceRegion1(tex->m_colorBindTex[bindIdx].Get(), 0, box.left, box.top, 0, tex->m_colorTex.Get(), 0, &box, D3D11_COPY_DISCARD); } } if (depth && tex->m_depthBindCount) { if (tex->m_samples > 1) { ctx->ResolveSubresource(tex->m_depthBindTex[bindIdx].Get(), 0, tex->m_depthTex.Get(), 0, DXGI_FORMAT_D32_FLOAT); } else { ctx->CopyResource(tex->m_depthBindTex[bindIdx].Get(), tex->m_depthTex.Get()); } } } void resolveBindTexture(const boo::ObjToken& texture, const SWindowRect& rect, bool tlOrigin, int bindIdx, bool color, bool depth, bool clearDepth) { const D3D11TextureR* tex = texture.cast(); _resolveBindTexture(m_deferredCtx.Get(), tex, rect, tlOrigin, bindIdx, color, depth); if (clearDepth) m_deferredCtx->ClearDepthStencilView(tex->m_dsv.Get(), D3D11_CLEAR_DEPTH, 0.0f, 0); } boo::ObjToken m_doPresent; void resolveDisplay(const boo::ObjToken& source) { m_doPresent = source; } void execute(); }; template void D3D11GraphicsBufferD::update(ID3D11DeviceContext* ctx, int b) { int slot = 1 << b; if ((slot & m_validSlots) == 0) { ID3D11Buffer* res = m_bufs[b].Get(); D3D11_MAPPED_SUBRESOURCE d; if (SUCCEEDED(ctx->Map(res, 0, D3D11_MAP_WRITE_DISCARD, 0, &d))) { memcpy(d.pData, m_cpuBuf.get(), m_cpuSz); ctx->Unmap(res, 0); } m_validSlots |= slot; } } template void D3D11GraphicsBufferD::load(const void* data, size_t sz) { std::unique_lock lk(m_q->m_dynamicLock); size_t bufSz = std::min(sz, m_cpuSz); memcpy(m_cpuBuf.get(), data, bufSz); m_validSlots = 0; } template void* D3D11GraphicsBufferD::map(size_t sz) { if (sz > m_cpuSz) return nullptr; m_q->m_dynamicLock.lock(); return m_cpuBuf.get(); } template void D3D11GraphicsBufferD::unmap() { m_validSlots = 0; m_q->m_dynamicLock.unlock(); } void D3D11TextureD::update(ID3D11DeviceContext* ctx, int b) { int slot = 1 << b; if ((slot & m_validSlots) == 0) { ID3D11Texture2D* res = m_texs[b].Get(); D3D11_MAPPED_SUBRESOURCE d; ctx->Map(res, 0, D3D11_MAP_WRITE_DISCARD, 0, &d); size_t rowSz = m_pxPitch * m_width; for (size_t i=0 ; i(d.pData)+=d.RowPitch) memmove(d.pData, m_cpuBuf.get() + i, rowSz); ctx->Unmap(res, 0); m_validSlots |= slot; } } void D3D11TextureD::load(const void* data, size_t sz) { std::unique_lock lk(m_q->m_dynamicLock); size_t bufSz = std::min(sz, m_cpuSz); memcpy(m_cpuBuf.get(), data, bufSz); m_validSlots = 0; } void* D3D11TextureD::map(size_t sz) { if (sz > m_cpuSz) return nullptr; m_q->m_dynamicLock.lock(); return m_cpuBuf.get(); } void D3D11TextureD::unmap() { m_validSlots = 0; m_q->m_dynamicLock.unlock(); } class D3D11DataFactory : public D3DDataFactory, public GraphicsDataFactoryHead { friend struct D3D11CommandQueue; IGraphicsContext* m_parent; struct D3D11Context* m_ctx; std::unordered_map> m_sharedShaders; std::unordered_map m_sourceToBinary; float m_gamma = 1.f; ObjToken m_gammaShader; ObjToken m_gammaLUT; ObjToken m_gammaVBO; ObjToken m_gammaVFMT; ObjToken m_gammaBinding; void SetupGammaResources() { commitTransaction([this](IGraphicsDataFactory::Context& ctx) { const VertexElementDescriptor vfmt[] = { {nullptr, nullptr, VertexSemantic::Position4}, {nullptr, nullptr, VertexSemantic::UV4} }; m_gammaVFMT = ctx.newVertexFormat(2, vfmt); m_gammaShader = static_cast(ctx).newShaderPipeline(GammaVS, GammaFS, nullptr, nullptr, nullptr, m_gammaVFMT, BlendFactor::One, BlendFactor::Zero, Primitive::TriStrips, ZTest::None, false, true, false, CullMode::None, true); m_gammaLUT = ctx.newDynamicTexture(256, 256, TextureFormat::I16, TextureClampMode::ClampToEdge); setDisplayGamma(1.f); const struct Vert { float pos[4]; float uv[4]; } verts[4] = { {{-1.f, 1.f, 0.f, 1.f}, {0.f, 0.f, 0.f, 0.f}}, {{ 1.f, 1.f, 0.f, 1.f}, {1.f, 0.f, 0.f, 0.f}}, {{-1.f, -1.f, 0.f, 1.f}, {0.f, 1.f, 0.f, 0.f}}, {{ 1.f, -1.f, 0.f, 1.f}, {1.f, 1.f, 0.f, 0.f}} }; m_gammaVBO = ctx.newStaticBuffer(BufferUse::Vertex, verts, 32, 4); ObjToken texs[] = {{}, m_gammaLUT.get()}; m_gammaBinding = ctx.newShaderDataBinding(m_gammaShader, m_gammaVFMT, m_gammaVBO.get(), {}, {}, 0, nullptr, nullptr, 2, texs, nullptr, nullptr); return true; } BooTrace); } public: D3D11DataFactory(IGraphicsContext* parent, D3D11Context* ctx) : m_parent(parent), m_ctx(ctx) { UINT qLevels; while (SUCCEEDED(ctx->m_dev->CheckMultisampleQualityLevels (m_ctx->m_fbFormat, m_ctx->m_sampleCount, &qLevels)) && !qLevels) m_ctx->m_sampleCount = flp2(m_ctx->m_sampleCount - 1); } Platform platform() const {return Platform::D3D11;} const SystemChar* platformName() const {return _S("D3D11");} class Context : public D3DDataFactory::Context { friend class D3D11DataFactory; D3D11DataFactory& m_parent; boo::ObjToken m_data; Context(D3D11DataFactory& parent __BooTraceArgs) : m_parent(parent), m_data(new BaseGraphicsData(parent __BooTraceArgsUse)) {} public: Platform platform() const {return Platform::D3D11;} const SystemChar* platformName() const {return _S("D3D11");} boo::ObjToken newStaticBuffer(BufferUse use, const void* data, size_t stride, size_t count) { return {new D3D11GraphicsBufferS(m_data, use, m_parent.m_ctx, data, stride, count)}; } boo::ObjToken newDynamicBuffer(BufferUse use, size_t stride, size_t count) { D3D11CommandQueue* q = static_cast(m_parent.m_parent->getCommandQueue()); return {new D3D11GraphicsBufferD(m_data, q, use, m_parent.m_ctx, stride, count)}; } boo::ObjToken newStaticTexture(size_t width, size_t height, size_t mips, TextureFormat fmt, TextureClampMode clampMode, const void* data, size_t sz) { return {new D3D11TextureS(m_data, m_parent.m_ctx, width, height, mips, fmt, data, sz)}; } boo::ObjToken newStaticArrayTexture(size_t width, size_t height, size_t layers, size_t mips, TextureFormat fmt, TextureClampMode clampMode, const void* data, size_t sz) { return {new D3D11TextureSA(m_data, m_parent.m_ctx, width, height, layers, mips, fmt, data, sz)}; } boo::ObjToken newDynamicTexture(size_t width, size_t height, TextureFormat fmt, TextureClampMode clampMode) { D3D11CommandQueue* q = static_cast(m_parent.m_parent->getCommandQueue()); return {new D3D11TextureD(m_data, q, m_parent.m_ctx, width, height, fmt)}; } boo::ObjToken newRenderTexture(size_t width, size_t height, TextureClampMode clampMode, size_t colorBindCount, size_t depthBindCount) { return {new D3D11TextureR(m_data, m_parent.m_ctx, width, height, m_parent.m_ctx->m_sampleCount, colorBindCount, depthBindCount)}; } boo::ObjToken newVertexFormat(size_t elementCount, const VertexElementDescriptor* elements, size_t baseVert, size_t baseInst) { return {new struct D3D11VertexFormat(m_data, elementCount, elements)}; } #if _DEBUG && 0 #define BOO_D3DCOMPILE_FLAG D3DCOMPILE_DEBUG | D3DCOMPILE_OPTIMIZATION_LEVEL0 #else #define BOO_D3DCOMPILE_FLAG D3DCOMPILE_OPTIMIZATION_LEVEL3 #endif static uint64_t CompileVert(ComPtr& vertBlobOut, const char* vertSource, uint64_t srcKey, D3D11DataFactory& factory) { ComPtr errBlob; if (FAILED(D3DCompilePROC(vertSource, strlen(vertSource), "HECL Vert Source", nullptr, nullptr, "main", "vs_5_0", BOO_D3DCOMPILE_FLAG, 0, &vertBlobOut, &errBlob))) { printf("%s\n", vertSource); Log.report(logvisor::Fatal, "error compiling vert shader: %s", errBlob->GetBufferPointer()); } XXH64_state_t hashState; XXH64_reset(&hashState, 0); XXH64_update(&hashState, vertBlobOut->GetBufferPointer(), vertBlobOut->GetBufferSize()); uint64_t binKey = XXH64_digest(&hashState); factory.m_sourceToBinary[srcKey] = binKey; return binKey; } static uint64_t CompileFrag(ComPtr& fragBlobOut, const char* fragSource, uint64_t srcKey, D3D11DataFactory& factory) { ComPtr errBlob; if (FAILED(D3DCompilePROC(fragSource, strlen(fragSource), "HECL Pixel Source", nullptr, nullptr, "main", "ps_5_0", BOO_D3DCOMPILE_FLAG, 0, &fragBlobOut, &errBlob))) { printf("%s\n", fragSource); Log.report(logvisor::Fatal, "error compiling pixel shader: %s", errBlob->GetBufferPointer()); } XXH64_state_t hashState; XXH64_reset(&hashState, 0); XXH64_update(&hashState, fragBlobOut->GetBufferPointer(), fragBlobOut->GetBufferSize()); uint64_t binKey = XXH64_digest(&hashState); factory.m_sourceToBinary[srcKey] = binKey; return binKey; } boo::ObjToken newShaderPipeline (const char* vertSource, const char* fragSource, ComPtr* vertBlobOut, ComPtr* fragBlobOut, ComPtr* pipelineBlob, const boo::ObjToken& vtxFmt, BlendFactor srcFac, BlendFactor dstFac, Primitive prim, ZTest depthTest, bool depthWrite, bool colorWrite, bool alphaWrite, CullMode culling, bool overwriteAlpha) { XXH64_state_t hashState; uint64_t srcHashes[2] = {}; uint64_t binHashes[2] = {}; XXH64_reset(&hashState, 0); if (vertSource) { XXH64_update(&hashState, vertSource, strlen(vertSource)); srcHashes[0] = XXH64_digest(&hashState); auto binSearch = m_parent.m_sourceToBinary.find(srcHashes[0]); if (binSearch != m_parent.m_sourceToBinary.cend()) binHashes[0] = binSearch->second; } else if (vertBlobOut && *vertBlobOut) { XXH64_update(&hashState, (*vertBlobOut)->GetBufferPointer(), (*vertBlobOut)->GetBufferSize()); binHashes[0] = XXH64_digest(&hashState); } XXH64_reset(&hashState, 0); if (fragSource) { XXH64_update(&hashState, fragSource, strlen(fragSource)); srcHashes[1] = XXH64_digest(&hashState); auto binSearch = m_parent.m_sourceToBinary.find(srcHashes[1]); if (binSearch != m_parent.m_sourceToBinary.cend()) binHashes[1] = binSearch->second; } else if (fragBlobOut && *fragBlobOut) { XXH64_update(&hashState, (*fragBlobOut)->GetBufferPointer(), (*fragBlobOut)->GetBufferSize()); binHashes[1] = XXH64_digest(&hashState); } if (vertBlobOut && !*vertBlobOut) binHashes[0] = CompileVert(*vertBlobOut, vertSource, srcHashes[0], m_parent); if (fragBlobOut && !*fragBlobOut) binHashes[1] = CompileFrag(*fragBlobOut, fragSource, srcHashes[1], m_parent); struct D3D11Context* ctx = m_parent.m_ctx; D3D11ShareableShader::Token vertShader; D3D11ShareableShader::Token fragShader; auto vertFind = binHashes[0] ? m_parent.m_sharedShaders.find(binHashes[0]) : m_parent.m_sharedShaders.end(); if (vertFind != m_parent.m_sharedShaders.end()) { vertShader = vertFind->second->lock(); } else { ComPtr vertBlob; if (vertBlobOut) vertBlob = *vertBlobOut; else binHashes[0] = CompileVert(vertBlob, vertSource, srcHashes[0], m_parent); ComPtr vShader; ThrowIfFailed(ctx->m_dev->CreateVertexShader(vertBlob->GetBufferPointer(), vertBlob->GetBufferSize(), nullptr, &vShader)); auto it = m_parent.m_sharedShaders.emplace(std::make_pair(binHashes[0], std::make_unique(m_parent, srcHashes[0], binHashes[0], std::move(vShader), std::move(vertBlob)))).first; vertShader = it->second->lock(); } auto fragFind = binHashes[1] ? m_parent.m_sharedShaders.find(binHashes[1]) : m_parent.m_sharedShaders.end(); if (fragFind != m_parent.m_sharedShaders.end()) { fragShader = fragFind->second->lock(); } else { ComPtr fragBlob; ComPtr* useFragBlob; if (fragBlobOut) { useFragBlob = fragBlobOut; } else { useFragBlob = &fragBlob; binHashes[1] = CompileFrag(fragBlob, fragSource, srcHashes[1], m_parent); } ComPtr pShader; ThrowIfFailed(ctx->m_dev->CreatePixelShader((*useFragBlob)->GetBufferPointer(), (*useFragBlob)->GetBufferSize(), nullptr, &pShader)); auto it = m_parent.m_sharedShaders.emplace(std::make_pair(binHashes[1], std::make_unique(m_parent, srcHashes[1], binHashes[1], std::move(pShader)))).first; fragShader = it->second->lock(); } return {new D3D11ShaderPipeline(m_data, ctx, std::move(vertShader), std::move(fragShader), vtxFmt, srcFac, dstFac, prim, depthTest, depthWrite, colorWrite, alphaWrite, overwriteAlpha, culling)}; } boo::ObjToken newShaderDataBinding( const boo::ObjToken& pipeline, const boo::ObjToken& vtxFormat, const boo::ObjToken& vbuf, const boo::ObjToken& instVbo, const boo::ObjToken& ibuf, size_t ubufCount, const boo::ObjToken* ubufs, const PipelineStage* ubufStages, const size_t* ubufOffs, const size_t* ubufSizes, size_t texCount, const boo::ObjToken* texs, const int* texBindIdx, const bool* depthBind, size_t baseVert, size_t baseInst) { return {new D3D11ShaderDataBinding(m_data, m_parent.m_ctx, pipeline, vbuf, instVbo, ibuf, ubufCount, ubufs, ubufStages, ubufOffs, ubufSizes, texCount, texs, texBindIdx, depthBind, baseVert, baseInst)}; } }; boo::ObjToken newPoolBuffer(BufferUse use, size_t stride, size_t count __BooTraceArgs) { D3D11CommandQueue* q = static_cast(m_parent->getCommandQueue()); boo::ObjToken pool(new BaseGraphicsPool(*this __BooTraceArgsUse)); return {new D3D11GraphicsBufferD(pool, q, use, m_ctx, stride, count)}; } void commitTransaction(const FactoryCommitFunc& trans __BooTraceArgs) { D3D11DataFactory::Context ctx(*this __BooTraceArgsUse); trans(ctx); } void _unregisterShareableShader(uint64_t srcKey, uint64_t binKey) { if (srcKey) m_sourceToBinary.erase(srcKey); m_sharedShaders.erase(binKey); } void setDisplayGamma(float gamma) { if (m_ctx->m_fbFormat == DXGI_FORMAT_R16G16B16A16_FLOAT) m_gamma = gamma * 2.2f; else m_gamma = gamma; if (m_gamma != 1.f) UpdateGammaLUT(m_gammaLUT.get(), m_gamma); } }; void D3D11CommandQueue::RenderingWorker(D3D11CommandQueue* self) { { std::unique_lock lk(self->m_initmt); } self->m_initcv.notify_one(); D3D11DataFactory* dataFactory = static_cast(self->m_parent->getDataFactory()); while (self->m_running) { { std::unique_lock lk(self->m_mt); self->m_cv.wait(lk); if (!self->m_running) break; self->m_drawBuf = self->m_completeBuf; auto& CmdList = self->m_cmdLists[self->m_drawBuf]; self->ProcessDynamicLoads(self->m_ctx->m_devCtx.Get()); if (self->m_texResizes.size()) { for (const auto& resize : self->m_texResizes) resize.first->resize(self->m_ctx, resize.second.first, resize.second.second); self->m_texResizes.clear(); CmdList.reset(); continue; } if (self->m_windowCtx->m_needsFSTransition) { if (self->m_windowCtx->m_fs) { self->m_windowCtx->m_swapChain->SetFullscreenState(true, nullptr); self->m_windowCtx->m_swapChain->ResizeTarget(&self->m_windowCtx->m_fsdesc); } else self->m_windowCtx->m_swapChain->SetFullscreenState(false, nullptr); self->m_windowCtx->m_needsFSTransition = false; CmdList.reset(); continue; } if (self->m_windowCtx->m_needsResize) { self->m_windowCtx->clearRTV(); self->m_windowCtx->m_swapChain->ResizeBuffers(2, self->m_windowCtx->width, self->m_windowCtx->height, self->m_ctx->m_fbFormat, DXGI_SWAP_CHAIN_FLAG_ALLOW_MODE_SWITCH); self->m_windowCtx->setupRTV(self->m_windowCtx->m_swapChain, self->m_ctx->m_dev.Get()); self->m_windowCtx->m_needsResize = false; CmdList.reset(); continue; } } auto& CmdList = self->m_cmdLists[self->m_drawBuf]; ID3D11CommandList* list = CmdList.list.Get(); self->m_ctx->m_devCtx->ExecuteCommandList(list, false); if (D3D11TextureR* csource = CmdList.workDoPresent.cast()) { #ifndef NDEBUG if (!csource->m_colorBindCount) Log.report(logvisor::Fatal, "texture provided to resolveDisplay() must have at least 1 color binding"); #endif if (dataFactory->m_gamma != 1.f) { SWindowRect rect(0, 0, csource->m_width, csource->m_height); self->_resolveBindTexture(self->m_ctx->m_devCtx.Get(), csource, rect, true, 0, true, false); ID3D11RenderTargetView* rtv = self->m_windowCtx->m_swapChainRTV.Get(); self->m_ctx->m_devCtx->OMSetRenderTargets(1, &rtv, nullptr); D3D11_VIEWPORT vp = {0.f, 0.f, FLOAT(csource->m_width), FLOAT(csource->m_height), 0.f, 1.f}; self->m_ctx->m_devCtx->RSSetViewports(1, &vp); D3D11_RECT d3drect = {0, 0, LONG(csource->m_width), LONG(csource->m_height)}; self->m_ctx->m_devCtx->RSSetScissorRects(1, &d3drect); ID3D11SamplerState* samp[] = {self->m_ctx->m_ss[0].Get(), self->m_ctx->m_ss[1].Get(), self->m_ctx->m_ss[2].Get(), self->m_ctx->m_ss[3].Get()}; self->m_ctx->m_devCtx->PSSetSamplers(0, 4, samp); D3D11ShaderDataBinding* gammaBinding = dataFactory->m_gammaBinding.cast(); gammaBinding->m_texs[0].tex = CmdList.workDoPresent.get(); gammaBinding->bind(self->m_ctx->m_devCtx.Get(), self->m_drawBuf); self->m_ctx->m_devCtx->Draw(4, 0); gammaBinding->m_texs[0].tex.reset(); } else { ComPtr dest = self->m_windowCtx->m_swapChainTex; ID3D11Texture2D* src = csource->m_colorTex.Get(); if (csource->m_samples > 1) self->m_ctx->m_devCtx->ResolveSubresource(dest.Get(), 0, src, 0, self->m_ctx->m_fbFormat); else self->m_ctx->m_devCtx->CopyResource(dest.Get(), src); } self->m_windowCtx->m_swapChain->Present(1, 0); } CmdList.reset(); } } void D3D11CommandQueue::startRenderer() { static_cast(m_parent->getDataFactory())->SetupGammaResources(); } void D3D11CommandQueue::execute() { /* Finish command list */ auto& CmdList = m_cmdLists[m_fillBuf]; ThrowIfFailed(m_deferredCtx->FinishCommandList(false, &CmdList.list)); CmdList.workDoPresent = m_doPresent; m_doPresent = nullptr; /* Wait for worker thread to become ready */ std::unique_lock lk(m_mt); /* Ready for next frame */ m_completeBuf = m_fillBuf; for (size_t i=0 ; i<3 ; ++i) { if (i == m_completeBuf || i == m_drawBuf) continue; m_fillBuf = i; break; } /* Return control to worker thread */ lk.unlock(); m_cv.notify_one(); } void D3D11CommandQueue::ProcessDynamicLoads(ID3D11DeviceContext* ctx) { D3D11DataFactory* gfxF = static_cast(m_parent->getDataFactory()); std::unique_lock lk(m_dynamicLock); std::unique_lock datalk(gfxF->m_dataMutex); if (gfxF->m_dataHead) { for (BaseGraphicsData& d : *gfxF->m_dataHead) { if (d.m_DBufs) for (IGraphicsBufferD& b : *d.m_DBufs) static_cast&>(b).update(ctx, m_drawBuf); if (d.m_DTexs) for (ITextureD& t : *d.m_DTexs) static_cast(t).update(ctx, m_drawBuf); } } if (gfxF->m_poolHead) { for (BaseGraphicsPool& p : *gfxF->m_poolHead) { if (p.m_DBufs) for (IGraphicsBufferD& b : *p.m_DBufs) static_cast&>(b).update(ctx, m_drawBuf); } } } std::unique_ptr _NewD3D11CommandQueue(D3D11Context* ctx, D3D11Context::Window* windowCtx, IGraphicsContext* parent) { return std::make_unique(ctx, windowCtx, parent); } std::unique_ptr _NewD3D11DataFactory(D3D11Context* ctx, IGraphicsContext* parent) { return std::make_unique(parent, ctx); } }