dawn-cmake/test/bug/tint/914.wgsl.expected.msl

#include <metal_stdlib>

using namespace metal;
// Matrix dimensions consumed by the mm_readA / mm_readB / mm_write accessors
// for bounds checks and row-major index computation. The kernel binds this
// struct at buffer(3).
struct Uniforms {
  // Row bound for firstMatrix reads and resultMatrix writes.
  /* 0x0000 */ uint dimAOuter;
  // Column bound and row stride of firstMatrix; row bound of secondMatrix.
  /* 0x0004 */ uint dimInner;
  // Column bound and row stride of secondMatrix and resultMatrix.
  /* 0x0008 */ uint dimBOuter;
};
// Flat float storage for one matrix, addressed row-major by the accessors.
// NOTE(review): declared with a single element but indexed with computed
// offsets; presumably this stands in for a runtime-sized array whose real
// length comes from the bound buffer - confirm against the generator.
struct Matrix {
  /* 0x0000 */ float numbers[1];
};
// Struct wrapper around a 64-float array; used as one row of
// tint_array_wrapper.
struct tint_array_wrapper_1 {
  float arr[64];
};
// 64 x 64 float tile (64 rows of tint_array_wrapper_1). The kernel declares
// two threadgroup variables of this type and indexes them as
// .arr[row].arr[col].
struct tint_array_wrapper {
  tint_array_wrapper_1 arr[64];
};
// Struct wrapper around a 16-float array; the kernel uses it for its
// per-invocation accumulator `acc`.
struct tint_array_wrapper_2 {
  float arr[16];
};
// Struct wrapper around a 4-float array; the kernel uses it for `BCached`.
struct tint_array_wrapper_3 {
  float arr[4];
};

// Tiling parameters for the kernel below.
// Rows of the result handled by one invocation (scales local_id.y / global_id.y).
constant uint RowPerThread = 4u;
// Columns of the result handled by one invocation (scales local_id.x / global_id.x).
constant uint ColPerThread = 4u;
// NOTE(review): TileAOuter and TileBOuter are not referenced anywhere else in
// this file; presumably they describe the outer tile extents - confirm.
constant uint TileAOuter = 64u;
constant uint TileBOuter = 64u;
// Extent of a tile along the shared (inner) dimension; also the divisor used
// to compute the number of tiles the kernel iterates over.
constant uint TileInner = 64u;
// Fetches element (row, col) of firstMatrix using a row stride of
// uniforms.dimInner. Coordinates at or beyond dimAOuter rows / dimInner
// columns yield 0.0f without touching the buffer.
float mm_readA(constant Uniforms& uniforms, const device Matrix& firstMatrix, uint row, uint col) {
  bool const in_bounds = (row < uniforms.dimAOuter) && (col < uniforms.dimInner);
  if (!in_bounds) {
    return 0.0f;
  }
  uint const offset = (row * uniforms.dimInner) + col;
  return firstMatrix.numbers[offset];
}

// Fetches element (row, col) of secondMatrix using a row stride of
// uniforms.dimBOuter. Coordinates at or beyond dimInner rows / dimBOuter
// columns yield 0.0f without touching the buffer.
float mm_readB(constant Uniforms& uniforms, const device Matrix& secondMatrix, uint row, uint col) {
  bool const in_bounds = (row < uniforms.dimInner) && (col < uniforms.dimBOuter);
  if (!in_bounds) {
    return 0.0f;
  }
  uint const offset = (row * uniforms.dimBOuter) + col;
  return secondMatrix.numbers[offset];
}

// Stores `value` at element (row, col) of resultMatrix using a row stride of
// uniforms.dimBOuter. Writes at or beyond dimAOuter rows / dimBOuter columns
// are silently dropped.
void mm_write(constant Uniforms& uniforms, device Matrix& resultMatrix, uint row, uint col, float value) {
  if ((row >= uniforms.dimAOuter) || (col >= uniforms.dimBOuter)) {
    return;
  }
  resultMatrix.numbers[(row * uniforms.dimBOuter) + col] = value;
}

// Tiled matrix multiply: resultMatrix = firstMatrix * secondMatrix.
//
// Each invocation accumulates a RowPerThread x ColPerThread patch of the
// result. The inner dimension is walked in steps of TileInner; for every step
// the threadgroup stages one tile of each input in threadgroup memory,
// synchronises, and then every invocation multiplies its rows of the A tile
// with its columns of the B tile.
//
// Bindings: firstMatrix = buffer(0), secondMatrix = buffer(1),
// resultMatrix = buffer(2), uniforms = buffer(3).
//
// NOTE(review): the `TileInner / 16u` split below and the 64-entry tiles
// presumably assume a 16 x 16 threadgroup; the threadgroup size is not
// visible in this file - confirm at the dispatch site.
// NOTE(review): when uniforms.dimInner is 0 the unsigned `dimInner - 1u`
// wraps, so numTiles becomes very large (all reads then return 0.0f).
// Confirm callers never dispatch with a zero inner dimension.
// NOTE(review): per the path header this looks like generated expected
// output for 914.wgsl; the B-tile index fix below presumably has to be made
// in the WGSL input as well - confirm.
kernel void tint_symbol(uint3 local_id [[thread_position_in_threadgroup]], uint3 global_id [[thread_position_in_grid]], uint local_invocation_index [[thread_index_in_threadgroup]], constant Uniforms& uniforms [[buffer(3)]], const device Matrix& firstMatrix [[buffer(0)]], const device Matrix& secondMatrix [[buffer(1)]], device Matrix& resultMatrix [[buffer(2)]]) {
  // tint_symbol_4 holds the current tile of firstMatrix, tint_symbol_5 the
  // current tile of secondMatrix.
  threadgroup tint_array_wrapper tint_symbol_4;
  threadgroup tint_array_wrapper tint_symbol_5;
  // Invocation 0 zero-fills both tiles; the barrier makes that visible to the
  // rest of the threadgroup before anyone touches them.
  if ((local_invocation_index == 0u)) {
    tint_array_wrapper const tint_symbol_2 = {.arr={}};
    tint_symbol_4 = tint_symbol_2;
    tint_array_wrapper const tint_symbol_3 = {.arr={}};
    tint_symbol_5 = tint_symbol_3;
  }
  threadgroup_barrier(mem_flags::mem_threadgroup);

  // Top-left corner of this invocation's patch, in tile and global coordinates.
  uint const tileRow = (local_id.y * RowPerThread);
  uint const tileCol = (local_id.x * ColPerThread);
  uint const globalRow = (global_id.y * RowPerThread);
  uint const globalCol = (global_id.x * ColPerThread);
  // Ceiling division of dimInner by TileInner (for dimInner >= 1).
  uint const numTiles = (((uniforms.dimInner - 1u) / TileInner) + 1u);

  tint_array_wrapper_2 acc = {};
  float ACached = 0.0f;
  tint_array_wrapper_3 BCached = {};
  for (uint index = 0u; index < (RowPerThread * ColPerThread); index = (index + 1u)) {
    acc.arr[index] = 0.0f;
  }

  // Share of each tile that this invocation is responsible for loading.
  uint const ColPerThreadA = (TileInner / 16u);
  uint const tileColA = (local_id.x * ColPerThreadA);
  uint const RowPerThreadB = (TileInner / 16u);
  uint const tileRowB = (local_id.y * RowPerThreadB);

  for (uint t = 0u; t < numTiles; t = (t + 1u)) {
    // Stage this invocation's part of the A tile.
    for (uint innerRow = 0u; innerRow < RowPerThread; innerRow = (innerRow + 1u)) {
      for (uint innerCol = 0u; innerCol < ColPerThreadA; innerCol = (innerCol + 1u)) {
        uint const inputRow = (tileRow + innerRow);
        uint const inputCol = (tileColA + innerCol);
        tint_symbol_4.arr[inputRow].arr[inputCol] = mm_readA(uniforms, firstMatrix, (globalRow + innerRow), ((t * TileInner) + inputCol));
      }
    }
    // Stage this invocation's part of the B tile. The tile row must be
    // inputRow (the row that was fetched from secondMatrix), mirroring the
    // A-tile store above; indexing it with innerCol would only ever fill the
    // first ColPerThread rows, while the multiply below reads rows
    // 0..TileInner-1.
    for (uint innerRow = 0u; innerRow < RowPerThreadB; innerRow = (innerRow + 1u)) {
      for (uint innerCol = 0u; innerCol < ColPerThread; innerCol = (innerCol + 1u)) {
        uint const inputRow = (tileRowB + innerRow);
        uint const inputCol = (tileCol + innerCol);
        tint_symbol_5.arr[inputRow].arr[inputCol] = mm_readB(uniforms, secondMatrix, ((t * TileInner) + inputRow), (globalCol + innerCol));
      }
    }
    // Both tiles must be fully written before any invocation reads them.
    threadgroup_barrier(mem_flags::mem_threadgroup);

    // Multiply-accumulate over the staged tiles.
    for (uint k = 0u; k < TileInner; k = (k + 1u)) {
      for (uint inner = 0u; inner < ColPerThread; inner = (inner + 1u)) {
        BCached.arr[inner] = tint_symbol_5.arr[k].arr[(tileCol + inner)];
      }
      for (uint innerRow = 0u; innerRow < RowPerThread; innerRow = (innerRow + 1u)) {
        ACached = tint_symbol_4.arr[(tileRow + innerRow)].arr[k];
        for (uint innerCol = 0u; innerCol < ColPerThread; innerCol = (innerCol + 1u)) {
          uint const index = ((innerRow * ColPerThread) + innerCol);
          acc.arr[index] = (acc.arr[index] + (ACached * BCached.arr[innerCol]));
        }
      }
    }
    // Nobody may overwrite the tiles for the next step while others still read.
    threadgroup_barrier(mem_flags::mem_threadgroup);
  }

  // Write the accumulated patch back; mm_write drops out-of-range elements.
  for (uint innerRow = 0u; innerRow < RowPerThread; innerRow = (innerRow + 1u)) {
    for (uint innerCol = 0u; innerCol < ColPerThread; innerCol = (innerCol + 1u)) {
      uint const index = ((innerRow * ColPerThread) + innerCol);
      mm_write(uniforms, resultMatrix, (globalRow + innerRow), (globalCol + innerCol), acc.arr[index]);
    }
  }
}
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`#include <metal_stdlib>`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`using namespace metal;`
			`struct Uniforms {`
			`/* 0x0000 */ uint dimAOuter;`
			`/* 0x0004 */ uint dimInner;`
			`/* 0x0008 */ uint dimBOuter;`
			`};`
			`struct Matrix {`
			`/* 0x0000 */ float numbers[1];`
			`};`
			`struct tint_array_wrapper_1 {`
			`float arr[64];`
			`};`
			`struct tint_array_wrapper {`
			`tint_array_wrapper_1 arr[64];`
			`};`
			`struct tint_array_wrapper_2 {`
			`float arr[16];`
			`};`
			`struct tint_array_wrapper_3 {`
			`float arr[4];`
			`};`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`constant uint RowPerThread = 4u;`
			`constant uint ColPerThread = 4u;`
			`constant uint TileAOuter = 64u;`
			`constant uint TileBOuter = 64u;`
			`constant uint TileInner = 64u;`
			`float mm_readA(constant Uniforms& uniforms, const device Matrix& firstMatrix, uint row, uint col) {`
			`if (((row < uniforms.dimAOuter) && (col < uniforms.dimInner))) {`
			`float const result = firstMatrix.numbers[((row * uniforms.dimInner) + col)];`
			`return result;`
			`}`
			`return 0.0f;`
			`}`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`float mm_readB(constant Uniforms& uniforms, const device Matrix& secondMatrix, uint row, uint col) {`
			`if (((row < uniforms.dimInner) && (col < uniforms.dimBOuter))) {`
			`float const result = secondMatrix.numbers[((row * uniforms.dimBOuter) + col)];`
			`return result;`
			`}`
			`return 0.0f;`
			`}`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`void mm_write(constant Uniforms& uniforms, device Matrix& resultMatrix, uint row, uint col, float value) {`
			`if (((row < uniforms.dimAOuter) && (col < uniforms.dimBOuter))) {`
			`uint const index = (col + (row * uniforms.dimBOuter));`
			`resultMatrix.numbers[index] = value;`
			`}`
			`}`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`kernel void tint_symbol(uint3 local_id [[thread_position_in_threadgroup]], uint3 global_id [[thread_position_in_grid]], uint local_invocation_index [[thread_index_in_threadgroup]], constant Uniforms& uniforms [[buffer(3)]], const device Matrix& firstMatrix [[buffer(0)]], const device Matrix& secondMatrix [[buffer(1)]], device Matrix& resultMatrix [[buffer(2)]]) {`
			`threadgroup tint_array_wrapper tint_symbol_4;`
			`threadgroup tint_array_wrapper tint_symbol_5;`
test: Add bug case for tint:914 Bug: tint:914 Change-Id: Id17b675e947b170e460c415c15d5d75f311e65b0 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55247 Kokoro: Kokoro <noreply+kokoro@google.com> Auto-Submit: Ben Clayton <bclayton@google.com> Commit-Queue: James Price <jrprice@google.com> Reviewed-by: James Price <jrprice@google.com> 2021-06-19 17:34:35 +00:00			`if ((local_invocation_index == 0u)) {`
writer/msl: Fix continuing block emission Inline the `continuing` block in the places where `continue` is called. Simplifies the emission, and fixes emission of `let` statements in the loop. This fix matches the same approach in writer/hlsl. See: https://dawn-review.googlesource.com/c/tint/+/51784 Fixed: tint:833 Fixed: tint:914 Change-Id: If4d8cde62dfaf8efa24272854ca7ff5edc0a8234 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/55341 Commit-Queue: Ben Clayton <bclayton@chromium.org> Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: David Neto <dneto@google.com> 2021-06-21 08:49:27 +00:00			`tint_array_wrapper const tint_symbol_2 = {.arr={}};`
			`tint_symbol_4 = tint_symbol_2;`
			`tint_array_wrapper const tint_symbol_3 = {.arr={}};`
			`tint_symbol_5 = tint_symbol_3;`
			`}`
			`threadgroup_barrier(mem_flags::mem_threadgroup);`
			`uint const tileRow = (local_id.y * RowPerThread);`
			`uint const tileCol = (local_id.x * ColPerThread);`
			`uint const globalRow = (global_id.y * RowPerThread);`
			`uint const globalCol = (global_id.x * ColPerThread);`
			`uint const numTiles = (((uniforms.dimInner - 1u) / TileInner) + 1u);`
			`tint_array_wrapper_2 acc = {};`
			`float ACached = 0.0f;`
			`tint_array_wrapper_3 BCached = {};`
			`{`
			`uint index = 0u;`
			`while (true) {`
			`if (!((index < (RowPerThread * ColPerThread)))) {`
			`break;`
			`}`
			`acc.arr[index] = 0.0f;`
			`{`
			`index = (index + 1u);`
			`}`
			`}`
			`}`
			`uint const ColPerThreadA = (TileInner / 16u);`
			`uint const tileColA = (local_id.x * ColPerThreadA);`
			`uint const RowPerThreadB = (TileInner / 16u);`
			`uint const tileRowB = (local_id.y * RowPerThreadB);`
			`{`
			`uint t = 0u;`
			`while (true) {`
			`if (!((t < numTiles))) {`
			`break;`
			`}`
			`{`
			`uint innerRow = 0u;`
			`while (true) {`
			`if (!((innerRow < RowPerThread))) {`
			`break;`
			`}`
			`{`
			`uint innerCol = 0u;`
			`while (true) {`
			`if (!((innerCol < ColPerThreadA))) {`
			`break;`
			`}`
			`uint const inputRow = (tileRow + innerRow);`
			`uint const inputCol = (tileColA + innerCol);`
			`tint_symbol_4.arr[inputRow].arr[inputCol] = mm_readA(uniforms, firstMatrix, (globalRow + innerRow), ((t * TileInner) + inputCol));`
			`{`
			`innerCol = (innerCol + 1u);`
			`}`
			`}`
			`}`
			`{`
			`innerRow = (innerRow + 1u);`
			`}`
			`}`
			`}`
			`{`
			`uint innerRow = 0u;`
			`while (true) {`
			`if (!((innerRow < RowPerThreadB))) {`
			`break;`
			`}`
			`{`
			`uint innerCol = 0u;`
			`while (true) {`
			`if (!((innerCol < ColPerThread))) {`
			`break;`
			`}`
			`uint const inputRow = (tileRowB + innerRow);`
			`uint const inputCol = (tileCol + innerCol);`
			`tint_symbol_5.arr[innerCol].arr[inputCol] = mm_readB(uniforms, secondMatrix, ((t * TileInner) + inputRow), (globalCol + innerCol));`
			`{`
			`innerCol = (innerCol + 1u);`
			`}`
			`}`
			`}`
			`{`
			`innerRow = (innerRow + 1u);`
			`}`
			`}`
			`}`
			`threadgroup_barrier(mem_flags::mem_threadgroup);`
			`{`
			`uint k = 0u;`
			`while (true) {`
			`if (!((k < TileInner))) {`
			`break;`
			`}`
			`{`
			`uint inner = 0u;`
			`while (true) {`
			`if (!((inner < ColPerThread))) {`
			`break;`
			`}`
			`BCached.arr[inner] = tint_symbol_5.arr[k].arr[(tileCol + inner)];`
			`{`
			`inner = (inner + 1u);`
			`}`
			`}`
			`}`
			`{`
			`uint innerRow = 0u;`
			`while (true) {`
			`if (!((innerRow < RowPerThread))) {`
			`break;`
			`}`
			`ACached = tint_symbol_4.arr[(tileRow + innerRow)].arr[k];`
			`{`
			`uint innerCol = 0u;`
			`while (true) {`
			`if (!((innerCol < ColPerThread))) {`
			`break;`
			`}`
			`uint const index = ((innerRow * ColPerThread) + innerCol);`
			`acc.arr[index] = (acc.arr[index] + (ACached * BCached.arr[innerCol]));`
			`{`
			`innerCol = (innerCol + 1u);`
			`}`
			`}`
			`}`
			`{`
			`innerRow = (innerRow + 1u);`
			`}`
			`}`
			`}`
			`{`
			`k = (k + 1u);`
			`}`
			`}`
			`}`
			`threadgroup_barrier(mem_flags::mem_threadgroup);`
			`{`
			`t = (t + 1u);`
			`}`
			`}`
			`}`
			`{`
			`uint innerRow = 0u;`
			`while (true) {`
			`if (!((innerRow < RowPerThread))) {`
			`break;`
			`}`
			`{`
			`uint innerCol = 0u;`
			`while (true) {`
			`if (!((innerCol < ColPerThread))) {`
			`break;`
			`}`
			`uint const index = ((innerRow * ColPerThread) + innerCol);`
			`mm_write(uniforms, resultMatrix, (globalRow + innerRow), (globalCol + innerCol), acc.arr[index]);`
			`{`
			`innerCol = (innerCol + 1u);`
			`}`
			`}`
			`}`
			`{`
			`innerRow = (innerRow + 1u);`
			`}`
			`}`
			`}`
			`return;`
			`}`