Add Metal vertex pulling behind a flag

Implements vertex pulling on the Metal backend, hidden behind a flag until ready for use (we are missing support for more complicated vertex input types). Bug: dawn:480 Change-Id: I38028b80673693ebf21309ad5336561fb99f40dc Reviewed-on: https://dawn-review.googlesource.com/c/dawn/+/26522 Commit-Queue: Idan Raiter <idanr@google.com> Reviewed-by: Austin Eng <enga@chromium.org>
2025-07-15 17:45:58 +00:00 · 2020-08-13 23:53:59 +00:00 · 2020-08-13 23:53:59 +00:00 · d315022be5
commit d315022be5
parent e1604b9a64
13 changed files with 515 additions and 23 deletions
--- a/src/dawn_native/ShaderModule.cpp
+++ b/src/dawn_native/ShaderModule.cpp
@ -295,6 +295,82 @@ namespace dawn_native {
                    << " binding " << static_cast<uint32_t>(binding);
            return ostream.str();
        }
+
+#ifdef DAWN_ENABLE_WGSL
+        tint::ast::transform::VertexFormat ToTintVertexFormat(wgpu::VertexFormat format) {
+            switch (format) {
+                case wgpu::VertexFormat::UChar2:
+                    return tint::ast::transform::VertexFormat::kVec2U8;
+                case wgpu::VertexFormat::UChar4:
+                    return tint::ast::transform::VertexFormat::kVec4U8;
+                case wgpu::VertexFormat::Char2:
+                    return tint::ast::transform::VertexFormat::kVec2I8;
+                case wgpu::VertexFormat::Char4:
+                    return tint::ast::transform::VertexFormat::kVec4I8;
+                case wgpu::VertexFormat::UChar2Norm:
+                    return tint::ast::transform::VertexFormat::kVec2U8Norm;
+                case wgpu::VertexFormat::UChar4Norm:
+                    return tint::ast::transform::VertexFormat::kVec4U8Norm;
+                case wgpu::VertexFormat::Char2Norm:
+                    return tint::ast::transform::VertexFormat::kVec2I8Norm;
+                case wgpu::VertexFormat::Char4Norm:
+                    return tint::ast::transform::VertexFormat::kVec4I8Norm;
+                case wgpu::VertexFormat::UShort2:
+                    return tint::ast::transform::VertexFormat::kVec2U16;
+                case wgpu::VertexFormat::UShort4:
+                    return tint::ast::transform::VertexFormat::kVec4U16;
+                case wgpu::VertexFormat::Short2:
+                    return tint::ast::transform::VertexFormat::kVec2I16;
+                case wgpu::VertexFormat::Short4:
+                    return tint::ast::transform::VertexFormat::kVec4I16;
+                case wgpu::VertexFormat::UShort2Norm:
+                    return tint::ast::transform::VertexFormat::kVec2U16Norm;
+                case wgpu::VertexFormat::UShort4Norm:
+                    return tint::ast::transform::VertexFormat::kVec4U16Norm;
+                case wgpu::VertexFormat::Short2Norm:
+                    return tint::ast::transform::VertexFormat::kVec2I16Norm;
+                case wgpu::VertexFormat::Short4Norm:
+                    return tint::ast::transform::VertexFormat::kVec4I16Norm;
+                case wgpu::VertexFormat::Half2:
+                    return tint::ast::transform::VertexFormat::kVec2F16;
+                case wgpu::VertexFormat::Half4:
+                    return tint::ast::transform::VertexFormat::kVec4F16;
+                case wgpu::VertexFormat::Float:
+                    return tint::ast::transform::VertexFormat::kF32;
+                case wgpu::VertexFormat::Float2:
+                    return tint::ast::transform::VertexFormat::kVec2F32;
+                case wgpu::VertexFormat::Float3:
+                    return tint::ast::transform::VertexFormat::kVec3F32;
+                case wgpu::VertexFormat::Float4:
+                    return tint::ast::transform::VertexFormat::kVec4F32;
+                case wgpu::VertexFormat::UInt:
+                    return tint::ast::transform::VertexFormat::kU32;
+                case wgpu::VertexFormat::UInt2:
+                    return tint::ast::transform::VertexFormat::kVec2U32;
+                case wgpu::VertexFormat::UInt3:
+                    return tint::ast::transform::VertexFormat::kVec3U32;
+                case wgpu::VertexFormat::UInt4:
+                    return tint::ast::transform::VertexFormat::kVec4U32;
+                case wgpu::VertexFormat::Int:
+                    return tint::ast::transform::VertexFormat::kI32;
+                case wgpu::VertexFormat::Int2:
+                    return tint::ast::transform::VertexFormat::kVec2I32;
+                case wgpu::VertexFormat::Int3:
+                    return tint::ast::transform::VertexFormat::kVec3I32;
+                case wgpu::VertexFormat::Int4:
+                    return tint::ast::transform::VertexFormat::kVec4I32;
+            }
+        }
+
+        tint::ast::transform::InputStepMode ToTintInputStepMode(wgpu::InputStepMode mode) {
+            switch (mode) {
+                case wgpu::InputStepMode::Vertex:
+                    return tint::ast::transform::InputStepMode::kVertex;
+                case wgpu::InputStepMode::Instance:
+                    return tint::ast::transform::InputStepMode::kInstance;
+            }
+        }
+#endif
    }  // anonymous namespace

    MaybeError ValidateSpirv(DeviceBase*, const uint32_t* code, uint32_t codeSize) {
@ -400,6 +476,75 @@ namespace dawn_native {
        std::vector<uint32_t> spirv = generator.result();
        return std::move(spirv);
    }
+
+    ResultOrError<std::vector<uint32_t>> ConvertWGSLToSPIRVWithPulling(
+        const char* source,
+        const VertexStateDescriptor& vertexState,
+        const std::string& entryPoint,
+        uint32_t pullingBufferBindingSet) {
+        std::ostringstream errorStream;
+        errorStream << "Tint WGSL->SPIR-V failure:" << std::endl;
+
+        tint::Context context;
+        tint::reader::wgsl::Parser parser(&context, source);
+
+        // TODO: This is a duplicate parse with ValidateWGSL, need to store
+        // state between calls to avoid this.
+        if (!parser.Parse()) {
+            errorStream << "Parser: " << parser.error() << std::endl;
+            return DAWN_VALIDATION_ERROR(errorStream.str().c_str());
+        }
+
+        tint::ast::Module module = parser.module();
+        if (!module.IsValid()) {
+            errorStream << "Invalid module generated..." << std::endl;
+            return DAWN_VALIDATION_ERROR(errorStream.str().c_str());
+        }
+
+        tint::ast::transform::VertexPullingTransform transform(&context, &module);
+        auto state = std::make_unique<tint::ast::transform::VertexStateDescriptor>();
+        for (uint32_t i = 0; i < vertexState.vertexBufferCount; ++i) {
+            auto& vertexBuffer = vertexState.vertexBuffers[i];
+            tint::ast::transform::VertexBufferLayoutDescriptor layout;
+            layout.array_stride = vertexBuffer.arrayStride;
+            layout.step_mode = ToTintInputStepMode(vertexBuffer.stepMode);
+
+            for (uint32_t j = 0; j < vertexBuffer.attributeCount; ++j) {
+                auto& attribute = vertexBuffer.attributes[j];
+                tint::ast::transform::VertexAttributeDescriptor attr;
+                attr.format = ToTintVertexFormat(attribute.format);
+                attr.offset = attribute.offset;
+                attr.shader_location = attribute.shaderLocation;
+
+                layout.attributes.push_back(std::move(attr));
+            }
+
+            state->vertex_buffers.push_back(std::move(layout));
+        }
+        transform.SetVertexState(std::move(state));
+        transform.SetEntryPoint(entryPoint);
+        transform.SetPullingBufferBindingSet(pullingBufferBindingSet);
+
+        if (!transform.Run()) {
+            errorStream << "Vertex pulling transform: " << transform.GetError();
+            return DAWN_VALIDATION_ERROR(errorStream.str().c_str());
+        }
+
+        tint::TypeDeterminer type_determiner(&context, &module);
+        if (!type_determiner.Determine()) {
+            errorStream << "Type Determination: " << type_determiner.error();
+            return DAWN_VALIDATION_ERROR(errorStream.str().c_str());
+        }
+
+        tint::writer::spirv::Generator generator(std::move(module));
+        if (!generator.Generate()) {
+            errorStream << "Generator: " << generator.error() << std::endl;
+            return DAWN_VALIDATION_ERROR(errorStream.str().c_str());
+        }
+
+        std::vector<uint32_t> spirv = generator.result();
+        return std::move(spirv);
+    }
 #endif  // DAWN_ENABLE_WGSL

    MaybeError ValidateShaderModuleDescriptor(DeviceBase* device,
@ -1094,10 +1239,22 @@ namespace dawn_native {
        return mSpirv;
    }

+#ifdef DAWN_ENABLE_WGSL
+    ResultOrError<std::vector<uint32_t>> ShaderModuleBase::GeneratePullingSpirv(
+        const VertexStateDescriptor& vertexState,
+        const std::string& entryPoint,
+        uint32_t pullingBufferBindingSet) const {
+        return ConvertWGSLToSPIRVWithPulling(mWgsl.c_str(), vertexState, entryPoint,
+                                             pullingBufferBindingSet);
+    }
+#endif
+
    shaderc_spvc::CompileOptions ShaderModuleBase::GetCompileOptions() const {
        shaderc_spvc::CompileOptions options;
        options.SetValidate(GetDevice()->IsValidationEnabled());
        options.SetRobustBufferAccessPass(GetDevice()->IsRobustnessEnabled());
+        options.SetSourceEnvironment(shaderc_target_env_vulkan, shaderc_env_version_vulkan_1_1);
+        options.SetTargetEnvironment(shaderc_target_env_vulkan, shaderc_env_version_vulkan_1_1);
        return options;
    }

--- a/src/dawn_native/ShaderModule.h
+++ b/src/dawn_native/ShaderModule.h
@ -91,6 +91,13 @@ namespace dawn_native {
        shaderc_spvc::Context* GetContext();
        const std::vector<uint32_t>& GetSpirv() const;

+#ifdef DAWN_ENABLE_WGSL
+        ResultOrError<std::vector<uint32_t>> GeneratePullingSpirv(
+            const VertexStateDescriptor& vertexState,
+            const std::string& entryPoint,
+            uint32_t pullingBufferBindingSet) const;
+#endif
+
      protected:
        static MaybeError CheckSpvcSuccess(shaderc_spvc_status status, const char* error_msg);
        shaderc_spvc::CompileOptions GetCompileOptions() const;
--- a/src/dawn_native/Toggles.cpp
+++ b/src/dawn_native/Toggles.cpp
@ -138,7 +138,11 @@ namespace dawn_native {
               "Clear buffers on their first use. This is a temporary toggle only for the "
               "development of buffer lazy initialization and will be removed after buffer lazy "
               "initialization is completely implemented.",
-               "https://crbug.com/dawn/414"}}}};
+               "https://crbug.com/dawn/414"}},
+             {Toggle::MetalEnableVertexPulling,
+              {"metal_enable_vertex_pulling",
+               "Uses vertex pulling to protect out-of-bounds reads on Metal",
+               "https://crbug.com/dawn/480"}}}};

    }  // anonymous namespace

--- a/src/dawn_native/Toggles.h
+++ b/src/dawn_native/Toggles.h
@ -44,6 +44,7 @@ namespace dawn_native {
        UseDXC,
        DisableRobustness,
        LazyClearBufferOnFirstUse,
+        MetalEnableVertexPulling,

        EnumCount,
        InvalidEnum = EnumCount,
--- a/src/dawn_native/metal/CommandBufferMTL.mm
+++ b/src/dawn_native/metal/CommandBufferMTL.mm
@ -263,7 +263,9 @@ namespace dawn_native { namespace metal {
            // MSL code generated by SPIRV-Cross expects.
            PerStage<std::array<uint32_t, kGenericMetalBufferSlots>> data;

-            void Apply(id<MTLRenderCommandEncoder> render, RenderPipeline* pipeline) {
+            void Apply(id<MTLRenderCommandEncoder> render,
+                       RenderPipeline* pipeline,
+                       bool enableVertexPulling) {
                wgpu::ShaderStage stagesToApply =
                    dirtyStages & pipeline->GetStagesRequiringStorageBufferLength();

@ -274,6 +276,11 @@ namespace dawn_native { namespace metal {
                if (stagesToApply & wgpu::ShaderStage::Vertex) {
                    uint32_t bufferCount = ToBackend(pipeline->GetLayout())
                                               ->GetBufferBindingCount(SingleShaderStage::Vertex);
+
+                    if (enableVertexPulling) {
+                        bufferCount += pipeline->GetVertexStateDescriptor()->vertexBufferCount;
+                    }
+
                    [render setVertexBytes:data[SingleShaderStage::Vertex].data()
                                    length:sizeof(uint32_t) * bufferCount
                                   atIndex:kBufferLengthBufferSlot];
@ -483,10 +490,17 @@ namespace dawn_native { namespace metal {
        // all the relevant state.
        class VertexBufferTracker {
          public:
+            explicit VertexBufferTracker(StorageBufferLengthTracker* lengthTracker)
+                : mLengthTracker(lengthTracker) {
+            }
+
            void OnSetVertexBuffer(uint32_t slot, Buffer* buffer, uint64_t offset) {
                mVertexBuffers[slot] = buffer->GetMTLBuffer();
                mVertexBufferOffsets[slot] = offset;

+                ASSERT(buffer->GetSize() < std::numeric_limits<uint32_t>::max());
+                mVertexBufferBindingSizes[slot] = static_cast<uint32_t>(buffer->GetSize() - offset);
+
                // Use 64 bit masks and make sure there are no shift UB
                static_assert(kMaxVertexBuffers <= 8 * sizeof(unsigned long long) - 1, "");
                mDirtyVertexBuffers |= 1ull << slot;
@ -499,13 +513,22 @@ namespace dawn_native { namespace metal {
                mDirtyVertexBuffers |= pipeline->GetVertexBufferSlotsUsed();
            }

-            void Apply(id<MTLRenderCommandEncoder> encoder, RenderPipeline* pipeline) {
+            void Apply(id<MTLRenderCommandEncoder> encoder,
+                       RenderPipeline* pipeline,
+                       bool enableVertexPulling) {
                std::bitset<kMaxVertexBuffers> vertexBuffersToApply =
                    mDirtyVertexBuffers & pipeline->GetVertexBufferSlotsUsed();

                for (uint32_t dawnIndex : IterateBitSet(vertexBuffersToApply)) {
                    uint32_t metalIndex = pipeline->GetMtlVertexBufferIndex(dawnIndex);

+                    if (enableVertexPulling) {
+                        // Insert lengths for vertex buffers bound as storage buffers
+                        mLengthTracker->data[SingleShaderStage::Vertex][metalIndex] =
+                            mVertexBufferBindingSizes[dawnIndex];
+                        mLengthTracker->dirtyStages |= wgpu::ShaderStage::Vertex;
+                    }
+
                    [encoder setVertexBuffers:&mVertexBuffers[dawnIndex]
                                      offsets:&mVertexBufferOffsets[dawnIndex]
                                    withRange:NSMakeRange(metalIndex, 1)];
@ -519,6 +542,9 @@ namespace dawn_native { namespace metal {
            std::bitset<kMaxVertexBuffers> mDirtyVertexBuffers;
            std::array<id<MTLBuffer>, kMaxVertexBuffers> mVertexBuffers;
            std::array<NSUInteger, kMaxVertexBuffers> mVertexBufferOffsets;
+            std::array<uint32_t, kMaxVertexBuffers> mVertexBufferBindingSizes;
+
+            StorageBufferLengthTracker* mLengthTracker;
        };

    }  // anonymous namespace
@ -949,11 +975,12 @@ namespace dawn_native { namespace metal {
                                                       MTLRenderPassDescriptor* mtlRenderPass,
                                                       uint32_t width,
                                                       uint32_t height) {
+        bool enableVertexPulling = GetDevice()->IsToggleEnabled(Toggle::MetalEnableVertexPulling);
        RenderPipeline* lastPipeline = nullptr;
        id<MTLBuffer> indexBuffer = nil;
        uint32_t indexBufferBaseOffset = 0;
-        VertexBufferTracker vertexBuffers;
        StorageBufferLengthTracker storageBufferLengths = {};
+        VertexBufferTracker vertexBuffers(&storageBufferLengths);
        BindGroupTracker bindGroups(&storageBufferLengths);

        id<MTLRenderCommandEncoder> encoder = commandContext->BeginRender(mtlRenderPass);
@ -963,9 +990,9 @@ namespace dawn_native { namespace metal {
                case Command::Draw: {
                    DrawCmd* draw = iter->NextCommand<DrawCmd>();

-                    vertexBuffers.Apply(encoder, lastPipeline);
+                    vertexBuffers.Apply(encoder, lastPipeline, enableVertexPulling);
                    bindGroups.Apply(encoder);
-                    storageBufferLengths.Apply(encoder, lastPipeline);
+                    storageBufferLengths.Apply(encoder, lastPipeline, enableVertexPulling);

                    // The instance count must be non-zero, otherwise no-op
                    if (draw->instanceCount != 0) {
@ -991,9 +1018,9 @@ namespace dawn_native { namespace metal {
                    size_t formatSize =
                        IndexFormatSize(lastPipeline->GetVertexStateDescriptor()->indexFormat);

-                    vertexBuffers.Apply(encoder, lastPipeline);
+                    vertexBuffers.Apply(encoder, lastPipeline, enableVertexPulling);
                    bindGroups.Apply(encoder);
-                    storageBufferLengths.Apply(encoder, lastPipeline);
+                    storageBufferLengths.Apply(encoder, lastPipeline, enableVertexPulling);

                    // The index and instance count must be non-zero, otherwise no-op
                    if (draw->indexCount != 0 && draw->instanceCount != 0) {
@ -1025,9 +1052,9 @@ namespace dawn_native { namespace metal {
                case Command::DrawIndirect: {
                    DrawIndirectCmd* draw = iter->NextCommand<DrawIndirectCmd>();

-                    vertexBuffers.Apply(encoder, lastPipeline);
+                    vertexBuffers.Apply(encoder, lastPipeline, enableVertexPulling);
                    bindGroups.Apply(encoder);
-                    storageBufferLengths.Apply(encoder, lastPipeline);
+                    storageBufferLengths.Apply(encoder, lastPipeline, enableVertexPulling);

                    Buffer* buffer = ToBackend(draw->indirectBuffer.Get());
                    id<MTLBuffer> indirectBuffer = buffer->GetMTLBuffer();
@ -1040,9 +1067,9 @@ namespace dawn_native { namespace metal {
                case Command::DrawIndexedIndirect: {
                    DrawIndirectCmd* draw = iter->NextCommand<DrawIndirectCmd>();

-                    vertexBuffers.Apply(encoder, lastPipeline);
+                    vertexBuffers.Apply(encoder, lastPipeline, enableVertexPulling);
                    bindGroups.Apply(encoder);
-                    storageBufferLengths.Apply(encoder, lastPipeline);
+                    storageBufferLengths.Apply(encoder, lastPipeline, enableVertexPulling);

                    Buffer* buffer = ToBackend(draw->indirectBuffer.Get());
                    id<MTLBuffer> indirectBuffer = buffer->GetMTLBuffer();
--- a/src/dawn_native/metal/DeviceMTL.mm
+++ b/src/dawn_native/metal/DeviceMTL.mm
@ -61,6 +61,11 @@ namespace dawn_native { namespace metal {

    MaybeError Device::Initialize() {
        InitTogglesFromDriver();
+
+        if (!IsRobustnessEnabled() || !IsToggleEnabled(Toggle::UseSpvc)) {
+            ForceSetToggle(Toggle::MetalEnableVertexPulling, false);
+        }
+
        mCommandQueue = [mMtlDevice newCommandQueue];

        return DeviceBase::Initialize(new Queue(this));
--- a/src/dawn_native/metal/RenderPipelineMTL.mm
+++ b/src/dawn_native/metal/RenderPipelineMTL.mm
@ -329,11 +329,24 @@ namespace dawn_native { namespace metal {

        MTLRenderPipelineDescriptor* descriptorMTL = [MTLRenderPipelineDescriptor new];

+        // TODO: MakeVertexDesc should be const in the future, so we don't need to call it here when
+        // vertex pulling is enabled
+        MTLVertexDescriptor* vertexDesc = MakeVertexDesc();
+        descriptorMTL.vertexDescriptor = vertexDesc;
+        [vertexDesc release];
+
+        if (GetDevice()->IsToggleEnabled(Toggle::MetalEnableVertexPulling)) {
+            // Calling MakeVertexDesc first is important since it sets indices for packed bindings
+            MTLVertexDescriptor* emptyVertexDesc = [MTLVertexDescriptor new];
+            descriptorMTL.vertexDescriptor = emptyVertexDesc;
+            [emptyVertexDesc release];
+        }
+
        ShaderModule* vertexModule = ToBackend(descriptor->vertexStage.module);
        const char* vertexEntryPoint = descriptor->vertexStage.entryPoint;
        ShaderModule::MetalFunctionData vertexData;
        DAWN_TRY(vertexModule->GetFunction(vertexEntryPoint, SingleShaderStage::Vertex,
-                                           ToBackend(GetLayout()), &vertexData));
+                                           ToBackend(GetLayout()), &vertexData, 0xFFFFFFFF, this));

        descriptorMTL.vertexFunction = vertexData.function;
        if (vertexData.needsStorageBufferLength) {
@ -377,11 +390,6 @@ namespace dawn_native { namespace metal {
        }

        descriptorMTL.inputPrimitiveTopology = MTLInputPrimitiveTopology(GetPrimitiveTopology());
-
-        MTLVertexDescriptor* vertexDesc = MakeVertexDesc();
-        descriptorMTL.vertexDescriptor = vertexDesc;
-        [vertexDesc release];
-
        descriptorMTL.sampleCount = GetSampleCount();
        descriptorMTL.alphaToCoverageEnabled = descriptor->alphaToCoverageEnabled;

--- a/src/dawn_native/metal/ShaderModuleMTL.h
+++ b/src/dawn_native/metal/ShaderModuleMTL.h
@ -29,6 +29,7 @@ namespace dawn_native { namespace metal {

    class Device;
    class PipelineLayout;
+    class RenderPipeline;

    class ShaderModule final : public ShaderModuleBase {
      public:
@ -47,7 +48,8 @@ namespace dawn_native { namespace metal {
                               SingleShaderStage functionStage,
                               const PipelineLayout* layout,
                               MetalFunctionData* out,
-                               uint32_t sampleMask = 0xFFFFFFFF);
+                               uint32_t sampleMask = 0xFFFFFFFF,
+                               const RenderPipeline* renderPipeline = nullptr);

      private:
        ShaderModule(Device* device, const ShaderModuleDescriptor* descriptor);
--- a/src/dawn_native/metal/ShaderModuleMTL.mm
+++ b/src/dawn_native/metal/ShaderModuleMTL.mm
@ -17,6 +17,7 @@
 #include "dawn_native/BindGroupLayout.h"
 #include "dawn_native/metal/DeviceMTL.h"
 #include "dawn_native/metal/PipelineLayoutMTL.h"
+#include "dawn_native/metal/RenderPipelineMTL.h"

 #include <spirv_msl.hpp>

@ -92,10 +93,24 @@ namespace dawn_native { namespace metal {
                                         SingleShaderStage functionStage,
                                         const PipelineLayout* layout,
                                         ShaderModule::MetalFunctionData* out,
-                                         uint32_t sampleMask) {
+                                         uint32_t sampleMask,
+                                         const RenderPipeline* renderPipeline) {
        ASSERT(!IsError());
        ASSERT(out);
-        const std::vector<uint32_t>& spirv = GetSpirv();
+        const std::vector<uint32_t>* spirv = &GetSpirv();
+
+#ifdef DAWN_ENABLE_WGSL
+        // Use set 4 since it is bigger than what users can access currently
+        static const uint32_t kPullingBufferBindingSet = 4;
+        std::vector<uint32_t> pullingSpirv;
+        if (GetDevice()->IsToggleEnabled(Toggle::MetalEnableVertexPulling) &&
+            functionStage == SingleShaderStage::Vertex) {
+            DAWN_TRY_ASSIGN(pullingSpirv,
+                            GeneratePullingSpirv(*renderPipeline->GetVertexStateDescriptor(),
+                                                 functionName, kPullingBufferBindingSet));
+            spirv = &pullingSpirv;
+        }
+#endif

        std::unique_ptr<spirv_cross::CompilerMSL> compilerImpl;
        spirv_cross::CompilerMSL* compiler;
@ -103,7 +118,7 @@ namespace dawn_native { namespace metal {
            // Initializing the compiler is needed every call, because this method uses reflection
            // to mutate the compiler's IR.
            DAWN_TRY(
-                CheckSpvcSuccess(mSpvcContext.InitializeForMsl(spirv.data(), spirv.size(),
+                CheckSpvcSuccess(mSpvcContext.InitializeForMsl(spirv->data(), spirv->size(),
                                                               GetMSLCompileOptions(sampleMask)),
                                 "Unable to initialize instance of spvc"));
            DAWN_TRY(CheckSpvcSuccess(mSpvcContext.GetCompiler(reinterpret_cast<void**>(&compiler)),
@ -126,7 +141,7 @@ namespace dawn_native { namespace metal {

            options_msl.additional_fixed_sample_mask = sampleMask;

-            compilerImpl = std::make_unique<spirv_cross::CompilerMSL>(spirv);
+            compilerImpl = std::make_unique<spirv_cross::CompilerMSL>(*spirv);
            compiler = compilerImpl.get();
            compiler->set_msl_options(options_msl);
        }
@ -172,6 +187,22 @@ namespace dawn_native { namespace metal {
            }
        }

+        // Add vertex buffers bound as storage buffers
+        if (GetDevice()->IsToggleEnabled(Toggle::MetalEnableVertexPulling) &&
+            functionStage == SingleShaderStage::Vertex) {
+            for (uint32_t dawnIndex : IterateBitSet(renderPipeline->GetVertexBufferSlotsUsed())) {
+                uint32_t metalIndex = renderPipeline->GetMtlVertexBufferIndex(dawnIndex);
+
+                shaderc_spvc_msl_resource_binding mslBinding;
+                mslBinding.stage = ToSpvcExecutionModel(SingleShaderStage::Vertex);
+                mslBinding.desc_set = kPullingBufferBindingSet;
+                mslBinding.binding = dawnIndex;
+                mslBinding.msl_buffer = metalIndex;
+                DAWN_TRY(CheckSpvcSuccess(mSpvcContext.AddMSLResourceBinding(mslBinding),
+                                          "Unable to add MSL Resource Binding"));
+            }
+        }
+
        {
            if (GetDevice()->IsToggleEnabled(Toggle::UseSpvc)) {
                shaderc_spvc_execution_model executionModel = ToSpvcExecutionModel(functionStage);
@ -245,6 +276,11 @@ namespace dawn_native { namespace metal {
            out->needsStorageBufferLength = compiler->needs_buffer_size_buffer();
        }

+        if (GetDevice()->IsToggleEnabled(Toggle::MetalEnableVertexPulling) &&
+            functionStage == SingleShaderStage::Vertex && GetUsedVertexAttributes().any()) {
+            out->needsStorageBufferLength = true;
+        }
+
        return {};
    }

--- a/src/tests/BUILD.gn
+++ b/src/tests/BUILD.gn
@ -337,6 +337,10 @@ source_set("dawn_end2end_tests_sources") {
    frameworks = [ "IOSurface.framework" ]
  }

+  if (dawn_enable_wgsl) {
+    sources += [ "end2end/VertexBufferRobustnessTests.cpp" ]
+  }
+
  if (dawn_enable_opengl) {
    assert(dawn_supports_glfw_for_windowing)
  }
--- a/src/tests/end2end/VertexBufferRobustnessTests.cpp
+++ b/src/tests/end2end/VertexBufferRobustnessTests.cpp
@ -0,0 +1,231 @@
+// Copyright 2020 The Dawn Authors
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+#include "common/Assert.h"
+#include "common/Constants.h"
+#include "common/Math.h"
+#include "tests/DawnTest.h"
+#include "utils/ComboRenderPipelineDescriptor.h"
+#include "utils/WGPUHelpers.h"
+
+// Vertex buffer robustness tests that clamping is applied on vertex attributes. This would happen
+// on backends where vertex pulling is enabled, such as Metal.
+
+class VertexBufferRobustnessTest : public DawnTest {
+  protected:
+    void SetUp() override {
+        DawnTest::SetUp();
+        // SPVC must be used currently, since we rely on the robustness pass in it
+        DAWN_SKIP_TEST_IF(!IsSpvcBeingUsed());
+    }
+
+    // Creates a vertex module that tests an expression with given attributes. If successful, the
+    // point drawn would be moved out of the viewport. On failure, the point is kept inside the
+    // viewport.
+    wgpu::ShaderModule CreateVertexModule(const std::string& attributes,
+                                          const std::string& successExpression) {
+        return utils::CreateShaderModuleFromWGSL(device, (R"(
+                entry_point vertex as "main" = vtx_main;
+
+                )" + attributes + R"(
+                [[builtin position]] var<out> Position : vec4<f32>;
+
+                fn vtx_main() -> void {
+                    if ()" + successExpression + R"() {
+                        # Success case, move the vertex out of the viewport
+                        Position = vec4<f32>(-10.0, 0.0, 0.0, 1.0);
+                    } else {
+                        # Failure case, move the vertex inside the viewport
+                        Position = vec4<f32>(0.0, 0.0, 0.0, 1.0);
+                    }
+                    return;
+                }
+            )")
+                                                             .c_str());
+    }
+
+    // Runs the test, a true |expectation| meaning success
+    void DoTest(const std::string& attributes,
+                const std::string& successExpression,
+                utils::ComboVertexStateDescriptor vertexState,
+                wgpu::Buffer vertexBuffer,
+                uint64_t bufferOffset,
+                bool expectation) {
+        wgpu::ShaderModule vsModule = CreateVertexModule(attributes, successExpression);
+        wgpu::ShaderModule fsModule = utils::CreateShaderModuleFromWGSL(device, R"(
+                entry_point fragment as "main" = frag_main;
+                [[location 0]] var<out> outColor : vec4<f32>;
+                fn frag_main() -> void {
+                    outColor = vec4<f32>(1.0, 1.0, 1.0, 1.0);
+                    return;
+                }
+            )");
+
+        utils::BasicRenderPass renderPass = utils::CreateBasicRenderPass(device, 1, 1);
+
+        utils::ComboRenderPipelineDescriptor descriptor(device);
+        descriptor.vertexStage.module = vsModule;
+        descriptor.cFragmentStage.module = fsModule;
+        descriptor.primitiveTopology = wgpu::PrimitiveTopology::PointList;
+        descriptor.cVertexState = std::move(vertexState);
+        descriptor.cColorStates[0].format = renderPass.colorFormat;
+        renderPass.renderPassInfo.cColorAttachments[0].clearColor = {0, 0, 0, 1};
+
+        wgpu::RenderPipeline pipeline = device.CreateRenderPipeline(&descriptor);
+
+        wgpu::CommandEncoder encoder = device.CreateCommandEncoder();
+        wgpu::RenderPassEncoder pass = encoder.BeginRenderPass(&renderPass.renderPassInfo);
+        pass.SetPipeline(pipeline);
+        pass.SetVertexBuffer(0, vertexBuffer, bufferOffset);
+        pass.Draw(1000);
+        pass.EndPass();
+
+        wgpu::CommandBuffer commands = encoder.Finish();
+        queue.Submit(1, &commands);
+
+        RGBA8 noOutput(0, 0, 0, 255);
+        RGBA8 someOutput(255, 255, 255, 255);
+        EXPECT_PIXEL_RGBA8_EQ(expectation ? noOutput : someOutput, renderPass.color, 0, 0);
+    }
+};
+
+TEST_P(VertexBufferRobustnessTest, DetectInvalidValues) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(float);
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Float;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 0, so we see 111.0, leading to failure
+    float kVertices[] = {111.0, 473.0, 473.0};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : f32;", "a == 473.0", std::move(vertexState), vertexBuffer, 0,
+           false);
+}
+
+TEST_P(VertexBufferRobustnessTest, FloatClamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(float);
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Float;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 4, so we clamp to only values containing 473.0
+    float kVertices[] = {111.0, 473.0, 473.0};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : f32;", "a == 473.0", std::move(vertexState), vertexBuffer, 4,
+           true);
+}
+
+TEST_P(VertexBufferRobustnessTest, IntClamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(int32_t);
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Int;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 4, so we clamp to only values containing 473
+    int32_t kVertices[] = {111, 473, 473};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : i32;", "a == 473", std::move(vertexState), vertexBuffer, 4,
+           true);
+}
+
+TEST_P(VertexBufferRobustnessTest, UIntClamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(uint32_t);
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::UInt;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 4, so we clamp to only values containing 473
+    uint32_t kVertices[] = {111, 473, 473};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : u32;", "a == 473", std::move(vertexState), vertexBuffer, 4,
+           true);
+}
+
+TEST_P(VertexBufferRobustnessTest, Float2Clamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(float) * 2;
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Float2;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 8, so we clamp to only values containing 473.0
+    float kVertices[] = {111.0, 111.0, 473.0, 473.0};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : vec2<f32>;", "a[0] == 473.0 && a[1] == 473.0",
+           std::move(vertexState), vertexBuffer, 8, true);
+}
+
+TEST_P(VertexBufferRobustnessTest, Float3Clamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(float) * 3;
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Float3;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 12, so we clamp to only values containing 473.0
+    float kVertices[] = {111.0, 111.0, 111.0, 473.0, 473.0, 473.0};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : vec3<f32>;",
+           "a[0] == 473.0 && a[1] == 473.0 && a[2] == 473.0", std::move(vertexState), vertexBuffer,
+           12, true);
+}
+
+TEST_P(VertexBufferRobustnessTest, Float4Clamp) {
+    utils::ComboVertexStateDescriptor vertexState;
+    vertexState.vertexBufferCount = 1;
+    vertexState.cVertexBuffers[0].arrayStride = sizeof(float) * 4;
+    vertexState.cVertexBuffers[0].attributeCount = 1;
+    vertexState.cAttributes[0].format = wgpu::VertexFormat::Float4;
+    vertexState.cAttributes[0].offset = 0;
+    vertexState.cAttributes[0].shaderLocation = 0;
+
+    // Bind at an offset of 16, so we clamp to only values containing 473.0
+    float kVertices[] = {111.0, 111.0, 111.0, 111.0, 473.0, 473.0, 473.0, 473.0};
+    wgpu::Buffer vertexBuffer = utils::CreateBufferFromData(device, kVertices, sizeof(kVertices),
+                                                            wgpu::BufferUsage::Vertex);
+
+    DoTest("[[location 0]] var<in> a : vec4<f32>;",
+           "a[0] == 473.0 && a[1] == 473.0 && a[2] == 473.0 && a[3] == 473.0",
+           std::move(vertexState), vertexBuffer, 16, true);
+}
+
+DAWN_INSTANTIATE_TEST(VertexBufferRobustnessTest, MetalBackend({"metal_enable_vertex_pulling"}));
--- a/src/utils/WGPUHelpers.cpp
+++ b/src/utils/WGPUHelpers.cpp
@ -144,6 +144,14 @@ namespace utils {
        return CreateShaderModuleFromResult(device, result);
    }

+    wgpu::ShaderModule CreateShaderModuleFromWGSL(const wgpu::Device& device, const char* source) {
+        wgpu::ShaderModuleWGSLDescriptor wgslDesc;
+        wgslDesc.source = source;
+        wgpu::ShaderModuleDescriptor descriptor;
+        descriptor.nextInChain = &wgslDesc;
+        return device.CreateShaderModule(&descriptor);
+    }
+
    std::vector<uint32_t> CompileGLSLToSpirv(SingleShaderStage stage, const char* source) {
        shaderc_shader_kind kind = ShadercShaderKind(stage);

--- a/src/utils/WGPUHelpers.h
+++ b/src/utils/WGPUHelpers.h
@ -34,6 +34,8 @@ namespace utils {
                                          SingleShaderStage stage,
                                          const char* source);
    wgpu::ShaderModule CreateShaderModuleFromASM(const wgpu::Device& device, const char* source);
+    wgpu::ShaderModule CreateShaderModuleFromWGSL(const wgpu::Device& device, const char* source);
+
    std::vector<uint32_t> CompileGLSLToSpirv(SingleShaderStage stage, const char* source);

    wgpu::Buffer CreateBufferFromData(const wgpu::Device& device,