benchmarks: Add a basic set of benchmarks
Add google benchmark to the DEPs. Implement a basic set of benchmarks for each of the writers and the WGSL parser. Add build rules for CMake. GN build rules TODO. Add a simple go tool (ported from Marl) to diff two benchmarks. Less noisy than the one provided by google benchmark. Bug: tint:1378 Change-Id: I73cf92c5d9fd2d3bfac8f264864fd774afbd5d01 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/76840 Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: Ryan Harrison <rharrison@chromium.org> Commit-Queue: Ben Clayton <bclayton@chromium.org>
This commit is contained in:
parent
dcb24cea41
commit
be2362b18c
|
@ -81,6 +81,7 @@ option_if_not_defined(TINT_BUILD_FUZZERS "Build fuzzers" OFF)
|
|||
option_if_not_defined(TINT_BUILD_SPIRV_TOOLS_FUZZER "Build SPIRV-Tools fuzzer" OFF)
|
||||
option_if_not_defined(TINT_BUILD_AST_FUZZER "Build AST fuzzer" OFF)
|
||||
option_if_not_defined(TINT_BUILD_REGEX_FUZZER "Build regex fuzzer" OFF)
|
||||
option_if_not_defined(TINT_BUILD_BENCHMARKS "Build benchmarks" OFF)
|
||||
option_if_not_defined(TINT_BUILD_TESTS "Build tests" ${TINT_BUILD_TESTS_DEFAULT})
|
||||
option_if_not_defined(TINT_BUILD_AS_OTHER_OS "Override OS detection to force building of *_other.cc files" OFF)
|
||||
option_if_not_defined(TINT_BUILD_REMOTE_COMPILE "Build the remote-compile tool for validating shaders on a remote machine" OFF)
|
||||
|
@ -111,6 +112,7 @@ message(STATUS "Tint build fuzzers: ${TINT_BUILD_FUZZERS}")
|
|||
message(STATUS "Tint build SPIRV-Tools fuzzer: ${TINT_BUILD_SPIRV_TOOLS_FUZZER}")
|
||||
message(STATUS "Tint build AST fuzzer: ${TINT_BUILD_AST_FUZZER}")
|
||||
message(STATUS "Tint build regex fuzzer: ${TINT_BUILD_REGEX_FUZZER}")
|
||||
message(STATUS "Tint build benchmarks: ${TINT_BUILD_BENCHMARKS}")
|
||||
message(STATUS "Tint build tests: ${TINT_BUILD_TESTS}")
|
||||
message(STATUS "Tint build with ASAN: ${TINT_ENABLE_ASAN}")
|
||||
message(STATUS "Tint build with MSAN: ${TINT_ENABLE_MSAN}")
|
||||
|
@ -254,7 +256,7 @@ if(${TINT_BUILD_DOCS})
|
|||
endif(DOXYGEN_FOUND)
|
||||
endif()
|
||||
|
||||
function(tint_default_compile_options TARGET)
|
||||
function(tint_core_compile_options TARGET)
|
||||
target_include_directories(${TARGET} PUBLIC "${TINT_ROOT_SOURCE_DIR}")
|
||||
target_include_directories(${TARGET} PUBLIC "${TINT_ROOT_SOURCE_DIR}/include")
|
||||
|
||||
|
@ -263,20 +265,48 @@ function(tint_default_compile_options TARGET)
|
|||
"${TINT_ROOT_SOURCE_DIR}/third_party/spirv-headers/include")
|
||||
endif()
|
||||
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_SPV_READER=$<BOOL:${TINT_BUILD_SPV_READER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_WGSL_READER=$<BOOL:${TINT_BUILD_WGSL_READER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_GLSL_WRITER=$<BOOL:${TINT_BUILD_GLSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_HLSL_WRITER=$<BOOL:${TINT_BUILD_HLSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_MSL_WRITER=$<BOOL:${TINT_BUILD_MSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_SPV_WRITER=$<BOOL:${TINT_BUILD_SPV_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC
|
||||
-DTINT_BUILD_WGSL_WRITER=$<BOOL:${TINT_BUILD_WGSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_SPV_READER=$<BOOL:${TINT_BUILD_SPV_READER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_WGSL_READER=$<BOOL:${TINT_BUILD_WGSL_READER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_GLSL_WRITER=$<BOOL:${TINT_BUILD_GLSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_HLSL_WRITER=$<BOOL:${TINT_BUILD_HLSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_MSL_WRITER=$<BOOL:${TINT_BUILD_MSL_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_SPV_WRITER=$<BOOL:${TINT_BUILD_SPV_WRITER}>)
|
||||
target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_WGSL_WRITER=$<BOOL:${TINT_BUILD_WGSL_WRITER}>)
|
||||
|
||||
if (COMPILER_IS_LIKE_GNU)
|
||||
target_compile_options(${TARGET} PRIVATE
|
||||
-std=c++17
|
||||
-fno-exceptions
|
||||
-fno-rtti
|
||||
)
|
||||
|
||||
if (${TINT_ENABLE_MSAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=memory)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=memory)
|
||||
elseif (${TINT_ENABLE_ASAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=address)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=address)
|
||||
elseif (${TINT_ENABLE_UBSAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=undefined)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=undefined)
|
||||
endif()
|
||||
endif(COMPILER_IS_LIKE_GNU)
|
||||
|
||||
if (TINT_EMIT_COVERAGE)
|
||||
if(CMAKE_CXX_COMPILER_ID MATCHES "GNU")
|
||||
target_compile_options(${TARGET} PRIVATE "--coverage")
|
||||
target_link_options(${TARGET} PRIVATE "gcov")
|
||||
elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang")
|
||||
target_compile_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping")
|
||||
target_link_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping")
|
||||
else()
|
||||
message(FATAL_ERROR "Coverage generation not supported for the ${CMAKE_CXX_COMPILER_ID} toolchain")
|
||||
endif()
|
||||
endif(TINT_EMIT_COVERAGE)
|
||||
endfunction()
|
||||
|
||||
function(tint_default_compile_options TARGET)
|
||||
tint_core_compile_options(${TARGET})
|
||||
|
||||
set(COMMON_GNU_OPTIONS
|
||||
-Wall
|
||||
|
@ -299,11 +329,8 @@ function(tint_default_compile_options TARGET)
|
|||
-Weverything
|
||||
)
|
||||
|
||||
if (${COMPILER_IS_LIKE_GNU})
|
||||
if (COMPILER_IS_LIKE_GNU)
|
||||
target_compile_options(${TARGET} PRIVATE
|
||||
-std=c++17
|
||||
-fno-exceptions
|
||||
-fno-rtti
|
||||
-pedantic-errors
|
||||
${COMMON_GNU_OPTIONS}
|
||||
)
|
||||
|
@ -314,30 +341,7 @@ function(tint_default_compile_options TARGET)
|
|||
${COMMON_CLANG_OPTIONS}
|
||||
)
|
||||
endif()
|
||||
|
||||
if (${TINT_ENABLE_MSAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=memory)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=memory)
|
||||
elseif (${TINT_ENABLE_ASAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=address)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=address)
|
||||
elseif (${TINT_ENABLE_UBSAN})
|
||||
target_compile_options(${TARGET} PRIVATE -fsanitize=undefined)
|
||||
target_link_options(${TARGET} PRIVATE -fsanitize=undefined)
|
||||
endif()
|
||||
endif()
|
||||
|
||||
if (${TINT_EMIT_COVERAGE})
|
||||
if(CMAKE_CXX_COMPILER_ID MATCHES "GNU")
|
||||
target_compile_options(${TARGET} PRIVATE "--coverage")
|
||||
target_link_options(${TARGET} PRIVATE "gcov")
|
||||
elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang")
|
||||
target_compile_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping")
|
||||
target_link_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping")
|
||||
else()
|
||||
message(FATAL_ERROR "Coverage generation not supported for the ${CMAKE_CXX_COMPILER_ID} toolchain")
|
||||
endif()
|
||||
endif()
|
||||
endif(COMPILER_IS_LIKE_GNU)
|
||||
|
||||
if (MSVC)
|
||||
# Specify /EHs for exception handling.
|
||||
|
@ -379,7 +383,6 @@ function(tint_default_compile_options TARGET)
|
|||
)
|
||||
endif()
|
||||
endif()
|
||||
|
||||
endfunction()
|
||||
|
||||
add_subdirectory(third_party)
|
||||
|
|
4
DEPS
4
DEPS
|
@ -10,6 +10,7 @@ vars = {
|
|||
'chromium_git': 'https://chromium.googlesource.com',
|
||||
'github': '/external/github.com',
|
||||
|
||||
'benchmark_revision': 'e991355c02b93fe17713efe04cbc2e278e00fdbd',
|
||||
'build_revision': '555c8b467c21e2c4b22d00e87e3faa0431df9ac2',
|
||||
'buildtools_revision': 'f78b4b9f33bd8ef9944d5ce643daff1c31880189',
|
||||
'catapult_revision': 'fa35beefb3429605035f98211ddb8750dee6a13d',
|
||||
|
@ -101,6 +102,9 @@ deps = {
|
|||
'third_party/catapult': Var('chromium_git') + '/catapult.git@' +
|
||||
Var('catapult_revision'),
|
||||
|
||||
'third_party/benchmark': Var('chromium_git') + Var('github') +
|
||||
'/google/benchmark.git@' + Var('benchmark_revision'),
|
||||
|
||||
'third_party/googletest': Var('chromium_git') + Var('github') +
|
||||
'/google/googletest.git@' + Var('googletest_revision'),
|
||||
|
||||
|
|
|
@ -56,13 +56,7 @@ bool ReadFile(const std::string& input_file, std::vector<T>* buffer) {
|
|||
}
|
||||
|
||||
fseek(file, 0, SEEK_END);
|
||||
auto tell_file_size = ftell(file);
|
||||
if (tell_file_size <= 0) {
|
||||
std::cerr << "Input file of incorrect size: " << input_file << std::endl;
|
||||
fclose(file);
|
||||
return {};
|
||||
}
|
||||
const auto file_size = static_cast<size_t>(tell_file_size);
|
||||
const auto file_size = static_cast<size_t>(ftell(file));
|
||||
if (0 != (file_size % sizeof(T))) {
|
||||
std::cerr << "File " << input_file
|
||||
<< " does not contain an integral number of objects: "
|
||||
|
|
|
@ -84,7 +84,8 @@ if [ "$BUILD_SYSTEM" == "cmake" ]; then
|
|||
|
||||
COMMON_CMAKE_FLAGS=""
|
||||
COMMON_CMAKE_FLAGS+=" -DCMAKE_BUILD_TYPE=${BUILD_TYPE}"
|
||||
COMMON_CMAKE_FLAGS+=" -DTINT_DOCS_WARN_AS_ERROR=ON"
|
||||
COMMON_CMAKE_FLAGS+=" -DTINT_DOCS_WARN_AS_ERROR=1"
|
||||
COMMON_CMAKE_FLAGS+=" -DTINT_BUILD_BENCHMARKS=1"
|
||||
|
||||
if [ "$BUILD_TOOLCHAIN" == "clang" ]; then
|
||||
using clang-10.0.0
|
||||
|
@ -155,9 +156,9 @@ if [ "$BUILD_SYSTEM" == "cmake" ]; then
|
|||
|
||||
status "Checking disabling all readers and writers also builds"
|
||||
show_cmds
|
||||
cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=OFF -DTINT_BUILD_SPV_WRITER=OFF -DTINT_BUILD_WGSL_READER=OFF -DTINT_BUILD_WGSL_WRITER=OFF -DTINT_BUILD_MSL_WRITER=OFF -DTINT_BUILD_HLSL_WRITER=OFF
|
||||
cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=OFF -DTINT_BUILD_SPV_WRITER=OFF -DTINT_BUILD_WGSL_READER=OFF -DTINT_BUILD_WGSL_WRITER=OFF -DTINT_BUILD_MSL_WRITER=OFF -DTINT_BUILD_HLSL_WRITER=OFF -DTINT_BUILD_BENCHMARKS=OFF
|
||||
cmake --build . -- --jobs=$(nproc)
|
||||
cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=ON -DTINT_BUILD_SPV_WRITER=ON -DTINT_BUILD_WGSL_READER=ON -DTINT_BUILD_WGSL_WRITER=ON -DTINT_BUILD_MSL_WRITER=ON -DTINT_BUILD_HLSL_WRITER=ON
|
||||
cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=ON -DTINT_BUILD_SPV_WRITER=ON -DTINT_BUILD_WGSL_READER=ON -DTINT_BUILD_WGSL_WRITER=ON -DTINT_BUILD_MSL_WRITER=ON -DTINT_BUILD_HLSL_WRITER=ON -DTINT_BUILD_BENCHMARKS=ON
|
||||
hide_cmds
|
||||
else
|
||||
status "Unsupported build system: $BUILD_SYSTEM"
|
||||
|
|
|
@ -116,7 +116,7 @@ call :status "Configuring build system"
|
|||
@echo on
|
||||
mkdir %BUILD_DIR%
|
||||
cd /d %BUILD_DIR%
|
||||
set COMMON_CMAKE_FLAGS=-DTINT_BUILD_DOCS=O -DCMAKE_BUILD_TYPE=%BUILD_TYPE%
|
||||
set COMMON_CMAKE_FLAGS=-DTINT_BUILD_DOCS=O -DTINT_BUILD_BENCHMARKS=1 -DCMAKE_BUILD_TYPE=%BUILD_TYPE%
|
||||
@echo off
|
||||
|
||||
call :status "Building tint"
|
||||
|
|
|
@ -437,13 +437,7 @@ bool ReadFile(const std::string& input_file, std::vector<T>* buffer) {
|
|||
}
|
||||
|
||||
fseek(file, 0, SEEK_END);
|
||||
uint64_t tell_file_size = static_cast<uint64_t>(ftell(file));
|
||||
if (tell_file_size <= 0) {
|
||||
std::cerr << "Input file of incorrect size: " << input_file << std::endl;
|
||||
fclose(file);
|
||||
return {};
|
||||
}
|
||||
const auto file_size = static_cast<size_t>(tell_file_size);
|
||||
const auto file_size = static_cast<size_t>(ftell(file));
|
||||
if (0 != (file_size % sizeof(T))) {
|
||||
std::cerr << "File " << input_file
|
||||
<< " does not contain an integral number of objects: "
|
||||
|
|
|
@ -598,7 +598,10 @@ if(${TINT_BUILD_SPV_READER} OR ${TINT_BUILD_SPV_WRITER})
|
|||
endif()
|
||||
endif()
|
||||
|
||||
if(${TINT_BUILD_TESTS})
|
||||
################################################################################
|
||||
# Tests
|
||||
################################################################################
|
||||
if(TINT_BUILD_TESTS)
|
||||
set(TINT_TEST_SRCS
|
||||
ast/alias_test.cc
|
||||
ast/array_test.cc
|
||||
|
@ -1114,6 +1117,7 @@ if(${TINT_BUILD_TESTS})
|
|||
endif()
|
||||
|
||||
add_executable(tint_unittests ${TINT_TEST_SRCS})
|
||||
set_target_properties(${target} PROPERTIES FOLDER "Tests")
|
||||
|
||||
if(NOT MSVC)
|
||||
target_compile_options(tint_unittests PRIVATE
|
||||
|
@ -1133,4 +1137,41 @@ if(${TINT_BUILD_TESTS})
|
|||
endif()
|
||||
|
||||
add_test(NAME tint_unittests COMMAND tint_unittests)
|
||||
endif()
|
||||
endif(TINT_BUILD_TESTS)
|
||||
|
||||
################################################################################
|
||||
# Benchmarks
|
||||
################################################################################
|
||||
if(TINT_BUILD_BENCHMARKS)
|
||||
if(NOT TINT_BUILD_WGSL_READER)
|
||||
message(FATAL_ERROR "TINT_BUILD_BENCHMARKS requires TINT_BUILD_WGSL_READER")
|
||||
endif()
|
||||
|
||||
set(TINT_BENCHMARK_SRC
|
||||
"benchmark/benchmark.cc"
|
||||
"reader/wgsl/parser_bench.cc"
|
||||
)
|
||||
|
||||
if (${TINT_BUILD_GLSL_WRITER})
|
||||
list(APPEND TINT_BENCHMARK_SRC writer/glsl/generator_bench.cc)
|
||||
endif()
|
||||
if (${TINT_BUILD_HLSL_WRITER})
|
||||
list(APPEND TINT_BENCHMARK_SRC writer/hlsl/generator_bench.cc)
|
||||
endif()
|
||||
if (${TINT_BUILD_MSL_WRITER})
|
||||
list(APPEND TINT_BENCHMARK_SRC writer/msl/generator_bench.cc)
|
||||
endif()
|
||||
if (${TINT_BUILD_SPV_WRITER})
|
||||
list(APPEND TINT_BENCHMARK_SRC writer/spirv/generator_bench.cc)
|
||||
endif()
|
||||
if (${TINT_BUILD_WGSL_WRITER})
|
||||
list(APPEND TINT_BENCHMARK_SRC writer/wgsl/generator_bench.cc)
|
||||
endif()
|
||||
|
||||
add_executable(tint-benchmark ${TINT_BENCHMARK_SRC})
|
||||
set_target_properties(${target} PROPERTIES FOLDER "Benchmarks")
|
||||
|
||||
tint_core_compile_options(tint-benchmark)
|
||||
|
||||
target_link_libraries(tint-benchmark PRIVATE benchmark::benchmark libtint)
|
||||
endif(TINT_BUILD_BENCHMARKS)
|
||||
|
|
|
@ -0,0 +1,123 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
#include <filesystem>
|
||||
#include <sstream>
|
||||
#include <utility>
|
||||
#include <vector>
|
||||
|
||||
namespace tint::benchmark {
|
||||
namespace {
|
||||
|
||||
std::filesystem::path kInputFileDir;
|
||||
|
||||
/// Copies the content from the file named `input_file` to `buffer`,
|
||||
/// assuming each element in the file is of type `T`. If any error occurs,
|
||||
/// writes error messages to the standard error stream and returns false.
|
||||
/// Assumes the size of a `T` object is divisible by its required alignment.
|
||||
/// @returns true if we successfully read the file.
|
||||
template <typename T>
|
||||
std::variant<std::vector<T>, Error> ReadFile(const std::string& input_file) {
|
||||
FILE* file = nullptr;
|
||||
#if defined(_MSC_VER)
|
||||
fopen_s(&file, input_file.c_str(), "rb");
|
||||
#else
|
||||
file = fopen(input_file.c_str(), "rb");
|
||||
#endif
|
||||
if (!file) {
|
||||
return Error{"Failed to open " + input_file};
|
||||
}
|
||||
|
||||
fseek(file, 0, SEEK_END);
|
||||
const auto file_size = static_cast<size_t>(ftell(file));
|
||||
if (0 != (file_size % sizeof(T))) {
|
||||
std::stringstream err;
|
||||
err << "File " << input_file
|
||||
<< " does not contain an integral number of objects: " << file_size
|
||||
<< " bytes in the file, require " << sizeof(T) << " bytes per object";
|
||||
fclose(file);
|
||||
return Error{err.str()};
|
||||
}
|
||||
fseek(file, 0, SEEK_SET);
|
||||
|
||||
std::vector<T> buffer;
|
||||
buffer.resize(file_size / sizeof(T));
|
||||
|
||||
size_t bytes_read = fread(buffer.data(), 1, file_size, file);
|
||||
fclose(file);
|
||||
if (bytes_read != file_size) {
|
||||
return Error{"Failed to read " + input_file};
|
||||
}
|
||||
|
||||
return buffer;
|
||||
}
|
||||
|
||||
bool FindBenchmarkInputDir() {
|
||||
// Attempt to find the benchmark input files by searching up from the current
|
||||
// working directory.
|
||||
auto path = std::filesystem::current_path();
|
||||
while (std::filesystem::is_directory(path)) {
|
||||
auto test = path / "test" / "benchmark";
|
||||
if (std::filesystem::is_directory(test)) {
|
||||
kInputFileDir = test;
|
||||
return true;
|
||||
}
|
||||
auto parent = path.parent_path();
|
||||
if (path == parent) {
|
||||
break;
|
||||
}
|
||||
path = parent;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
} // namespace
|
||||
|
||||
std::variant<tint::Source::File, Error> LoadInputFile(std::string name) {
|
||||
auto path = (kInputFileDir / name).string();
|
||||
auto data = ReadFile<uint8_t>(path);
|
||||
if (auto* buf = std::get_if<std::vector<uint8_t>>(&data)) {
|
||||
return tint::Source::File(path, std::string(buf->begin(), buf->end()));
|
||||
}
|
||||
return std::get<Error>(data);
|
||||
}
|
||||
|
||||
std::variant<ProgramAndFile, Error> LoadProgram(std::string name) {
|
||||
auto res = benchmark::LoadInputFile(name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
return *err;
|
||||
}
|
||||
auto& file = std::get<Source::File>(res);
|
||||
auto program = reader::wgsl::Parse(&file);
|
||||
if (program.Diagnostics().contains_errors()) {
|
||||
return Error{program.Diagnostics().str()};
|
||||
}
|
||||
return ProgramAndFile{std::move(program), std::move(file)};
|
||||
}
|
||||
|
||||
} // namespace tint::benchmark
|
||||
|
||||
int main(int argc, char** argv) {
|
||||
::benchmark::Initialize(&argc, argv);
|
||||
if (::benchmark::ReportUnrecognizedArguments(argc, argv)) {
|
||||
return 1;
|
||||
}
|
||||
if (!tint::benchmark::FindBenchmarkInputDir()) {
|
||||
std::cerr << "failed to locate benchmark input files" << std::endl;
|
||||
return 1;
|
||||
}
|
||||
::benchmark::RunSpecifiedBenchmarks();
|
||||
}
|
|
@ -0,0 +1,69 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#ifndef SRC_BENCHMARK_BENCHMARK_H_
|
||||
#define SRC_BENCHMARK_BENCHMARK_H_
|
||||
|
||||
#include <memory>
|
||||
#include <string>
|
||||
#include <variant> // NOLINT: Found C system header after C++ system header.
|
||||
|
||||
#include "benchmark/benchmark.h"
|
||||
#include "src/utils/concat.h"
|
||||
#include "tint/tint.h"
|
||||
|
||||
namespace tint::benchmark {
|
||||
|
||||
/// Error indicates an operation did not complete successfully.
|
||||
struct Error {
|
||||
/// The error message.
|
||||
std::string msg;
|
||||
};
|
||||
|
||||
/// ProgramAndFile holds a Program and a Source::File.
|
||||
struct ProgramAndFile {
|
||||
/// The tint program parsed from file.
|
||||
Program program;
|
||||
/// The source file
|
||||
Source::File file;
|
||||
};
|
||||
|
||||
/// LoadInputFile attempts to load a benchmark input file with the given file
|
||||
/// name.
|
||||
/// @param name the file name
|
||||
/// @returns either the loaded Source::File or an Error
|
||||
std::variant<Source::File, Error> LoadInputFile(std::string name);
|
||||
|
||||
/// LoadInputFile attempts to load a benchmark input program with the given file
|
||||
/// name.
|
||||
/// @param name the file name
|
||||
/// @returns either the loaded Program or an Error
|
||||
std::variant<ProgramAndFile, Error> LoadProgram(std::string name);
|
||||
|
||||
/// Declares a benchmark with the given function and WGSL file name
|
||||
#define TINT_BENCHMARK_WGSL_PROGRAM(FUNC, WGSL_NAME) \
|
||||
BENCHMARK_CAPTURE(FUNC, WGSL_NAME, WGSL_NAME);
|
||||
|
||||
/// Declares a set of benchmarks for the given function using a list of WGSL
|
||||
/// files in `<tint>/test/benchmark`.
|
||||
#define TINT_BENCHMARK_WGSL_PROGRAMS(FUNC) \
|
||||
TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "empty.wgsl"); \
|
||||
TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "particles.wgsl"); \
|
||||
TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_fragment.wgsl"); \
|
||||
TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_vertex.wgsl"); \
|
||||
TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_compute.wgsl");
|
||||
|
||||
} // namespace tint::benchmark
|
||||
|
||||
#endif // SRC_BENCHMARK_BENCHMARK_H_
|
|
@ -0,0 +1,40 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::reader::wgsl {
|
||||
namespace {
|
||||
|
||||
void ParseWGSL(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadInputFile(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& file = std::get<Source::File>(res);
|
||||
for (auto _ : state) {
|
||||
auto res = Parse(&file);
|
||||
if (res.Diagnostics().contains_errors()) {
|
||||
state.SkipWithError(res.Diagnostics().str().c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(ParseWGSL);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::reader::wgsl
|
|
@ -0,0 +1,50 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/ast/module.h"
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::writer::glsl {
|
||||
namespace {
|
||||
|
||||
void GenerateGLSL(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadProgram(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& program = std::get<benchmark::ProgramAndFile>(res).program;
|
||||
std::vector<std::string> entry_points;
|
||||
for (auto& fn : program.AST().Functions()) {
|
||||
if (fn->IsEntryPoint()) {
|
||||
entry_points.emplace_back(program.Symbols().NameFor(fn->symbol));
|
||||
}
|
||||
}
|
||||
|
||||
for (auto _ : state) {
|
||||
for (auto& ep : entry_points) {
|
||||
auto res = Generate(&program, {}, ep);
|
||||
if (!res.error.empty()) {
|
||||
state.SkipWithError(res.error.c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(GenerateGLSL);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::writer::glsl
|
|
@ -0,0 +1,40 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::writer::hlsl {
|
||||
namespace {
|
||||
|
||||
void GenerateHLSL(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadProgram(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& program = std::get<benchmark::ProgramAndFile>(res).program;
|
||||
for (auto _ : state) {
|
||||
auto res = Generate(&program, {});
|
||||
if (!res.error.empty()) {
|
||||
state.SkipWithError(res.error.c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(GenerateHLSL);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::writer::hlsl
|
|
@ -0,0 +1,40 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::writer::msl {
|
||||
namespace {
|
||||
|
||||
void GenerateMSL(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadProgram(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& program = std::get<benchmark::ProgramAndFile>(res).program;
|
||||
for (auto _ : state) {
|
||||
auto res = Generate(&program, {});
|
||||
if (!res.error.empty()) {
|
||||
state.SkipWithError(res.error.c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(GenerateMSL);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::writer::msl
|
|
@ -0,0 +1,40 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::writer::spirv {
|
||||
namespace {
|
||||
|
||||
void GenerateSPIRV(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadProgram(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& program = std::get<benchmark::ProgramAndFile>(res).program;
|
||||
for (auto _ : state) {
|
||||
auto res = Generate(&program, {});
|
||||
if (!res.error.empty()) {
|
||||
state.SkipWithError(res.error.c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(GenerateSPIRV);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::writer::spirv
|
|
@ -0,0 +1,40 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// http://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
#include <string>
|
||||
|
||||
#include "src/benchmark/benchmark.h"
|
||||
|
||||
namespace tint::writer::wgsl {
|
||||
namespace {
|
||||
|
||||
void GenerateWGSL(::benchmark::State& state, std::string input_name) {
|
||||
auto res = benchmark::LoadProgram(input_name);
|
||||
if (auto err = std::get_if<benchmark::Error>(&res)) {
|
||||
state.SkipWithError(err->msg.c_str());
|
||||
return;
|
||||
}
|
||||
auto& program = std::get<benchmark::ProgramAndFile>(res).program;
|
||||
for (auto _ : state) {
|
||||
auto res = Generate(&program, {});
|
||||
if (!res.error.empty()) {
|
||||
state.SkipWithError(res.error.c_str());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TINT_BENCHMARK_WGSL_PROGRAMS(GenerateWGSL);
|
||||
|
||||
} // namespace
|
||||
} // namespace tint::writer::wgsl
|
|
@ -0,0 +1,4 @@
|
|||
[numthreads(1, 1, 1)]
|
||||
void unused_entry_point() {
|
||||
return;
|
||||
}
|
|
@ -0,0 +1,3 @@
|
|||
#include <metal_stdlib>
|
||||
|
||||
using namespace metal;
|
|
@ -0,0 +1,16 @@
|
|||
; SPIR-V
|
||||
; Version: 1.3
|
||||
; Generator: Google Tint Compiler; 0
|
||||
; Bound: 5
|
||||
; Schema: 0
|
||||
OpCapability Shader
|
||||
OpMemoryModel Logical GLSL450
|
||||
OpEntryPoint GLCompute %unused_entry_point "unused_entry_point"
|
||||
OpExecutionMode %unused_entry_point LocalSize 1 1 1
|
||||
OpName %unused_entry_point "unused_entry_point"
|
||||
%void = OpTypeVoid
|
||||
%1 = OpTypeFunction %void
|
||||
%unused_entry_point = OpFunction %void None %1
|
||||
%4 = OpLabel
|
||||
OpReturn
|
||||
OpFunctionEnd
|
|
@ -0,0 +1,183 @@
|
|||
////////////////////////////////////////////////////////////////////////////////
|
||||
// Utilities
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
var<private> rand_seed : vec2<f32>;
|
||||
|
||||
fn rand() -> f32 {
|
||||
rand_seed.x = fract(cos(dot(rand_seed, vec2<f32>(23.14077926, 232.61690225))) * 136.8168);
|
||||
rand_seed.y = fract(cos(dot(rand_seed, vec2<f32>(54.47856553, 345.84153136))) * 534.7645);
|
||||
return rand_seed.y;
|
||||
}
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
// Vertex shader
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
struct RenderParams {
|
||||
modelViewProjectionMatrix : mat4x4<f32>;
|
||||
right : vec3<f32>;
|
||||
up : vec3<f32>;
|
||||
};
|
||||
[[binding(0), group(0)]] var<uniform> render_params : RenderParams;
|
||||
|
||||
struct VertexInput {
|
||||
[[location(0)]] position : vec3<f32>;
|
||||
[[location(1)]] color : vec4<f32>;
|
||||
[[location(2)]] quad_pos : vec2<f32>; // -1..+1
|
||||
};
|
||||
|
||||
struct VertexOutput {
|
||||
[[builtin(position)]] position : vec4<f32>;
|
||||
[[location(0)]] color : vec4<f32>;
|
||||
[[location(1)]] quad_pos : vec2<f32>; // -1..+1
|
||||
};
|
||||
|
||||
[[stage(vertex)]]
|
||||
fn vs_main(in : VertexInput) -> VertexOutput {
|
||||
var quad_pos = mat2x3<f32>(render_params.right, render_params.up) * in.quad_pos;
|
||||
var position = in.position + quad_pos * 0.01;
|
||||
var out : VertexOutput;
|
||||
out.position = render_params.modelViewProjectionMatrix * vec4<f32>(position, 1.0);
|
||||
out.color = in.color;
|
||||
out.quad_pos = in.quad_pos;
|
||||
return out;
|
||||
}
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
// Fragment shader
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
[[stage(fragment)]]
|
||||
fn fs_main(in : VertexOutput) -> [[location(0)]] vec4<f32> {
|
||||
var color = in.color;
|
||||
// Apply a circular particle alpha mask
|
||||
color.a = color.a * max(1.0 - length(in.quad_pos), 0.0);
|
||||
return color;
|
||||
}
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
// Simulation Compute shader
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
struct SimulationParams {
|
||||
deltaTime : f32;
|
||||
seed : vec4<f32>;
|
||||
};
|
||||
|
||||
struct Particle {
|
||||
position : vec3<f32>;
|
||||
lifetime : f32;
|
||||
color : vec4<f32>;
|
||||
velocity : vec3<f32>;
|
||||
};
|
||||
|
||||
struct Particles {
|
||||
particles : array<Particle>;
|
||||
};
|
||||
|
||||
[[binding(0), group(0)]] var<uniform> sim_params : SimulationParams;
|
||||
[[binding(1), group(0)]] var<storage, read_write> data : Particles;
|
||||
[[binding(2), group(0)]] var texture : texture_2d<f32>;
|
||||
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn simulate([[builtin(global_invocation_id)]] GlobalInvocationID : vec3<u32>) {
|
||||
rand_seed = (sim_params.seed.xy + vec2<f32>(GlobalInvocationID.xy)) * sim_params.seed.zw;
|
||||
|
||||
let idx = GlobalInvocationID.x;
|
||||
var particle = data.particles[idx];
|
||||
|
||||
// Apply gravity
|
||||
particle.velocity.z = particle.velocity.z - sim_params.deltaTime * 0.5;
|
||||
|
||||
// Basic velocity integration
|
||||
particle.position = particle.position + sim_params.deltaTime * particle.velocity;
|
||||
|
||||
// Age each particle. Fade out before vanishing.
|
||||
particle.lifetime = particle.lifetime - sim_params.deltaTime;
|
||||
particle.color.a = smoothStep(0.0, 0.5, particle.lifetime);
|
||||
|
||||
// If the lifetime has gone negative, then the particle is dead and should be
|
||||
// respawned.
|
||||
if (particle.lifetime < 0.0) {
|
||||
// Use the probability map to find where the particle should be spawned.
|
||||
// Starting with the 1x1 mip level.
|
||||
var coord = vec2<i32>(0, 0);
|
||||
for (var level = textureNumLevels(texture) - 1; level > 0; level = level - 1) {
|
||||
// Load the probability value from the mip-level
|
||||
// Generate a random number and using the probabilty values, pick the
|
||||
// next texel in the next largest mip level:
|
||||
//
|
||||
// 0.0 probabilites.r probabilites.g probabilites.b 1.0
|
||||
// | | | | |
|
||||
// | TOP-LEFT | TOP-RIGHT | BOTTOM-LEFT | BOTTOM_RIGHT |
|
||||
//
|
||||
let probabilites = textureLoad(texture, coord, level);
|
||||
let value = vec4<f32>(rand());
|
||||
let mask = (value >= vec4<f32>(0.0, probabilites.xyz)) & (value < probabilites);
|
||||
coord = coord * 2;
|
||||
coord.x = coord.x + select(0, 1, any(mask.yw)); // x y
|
||||
coord.y = coord.y + select(0, 1, any(mask.zw)); // z w
|
||||
}
|
||||
let uv = vec2<f32>(coord) / vec2<f32>(textureDimensions(texture));
|
||||
particle.position = vec3<f32>((uv - 0.5) * 3.0 * vec2<f32>(1.0, -1.0), 0.0);
|
||||
particle.color = textureLoad(texture, coord, 0);
|
||||
particle.velocity.x = (rand() - 0.5) * 0.1;
|
||||
particle.velocity.y = (rand() - 0.5) * 0.1;
|
||||
particle.velocity.z = rand() * 0.3;
|
||||
particle.lifetime = 0.5 + rand() * 2.0;
|
||||
}
|
||||
|
||||
// Store the new particle value
|
||||
data.particles[idx] = particle;
|
||||
}
|
||||
|
||||
struct UBO {
|
||||
width : u32;
|
||||
};
|
||||
|
||||
struct Buffer {
|
||||
weights : array<f32>;
|
||||
};
|
||||
|
||||
[[binding(3), group(0)]] var<uniform> ubo : UBO;
|
||||
[[binding(4), group(0)]] var<storage, read> buf_in : Buffer;
|
||||
[[binding(5), group(0)]] var<storage, read_write> buf_out : Buffer;
|
||||
[[binding(6), group(0)]] var tex_in : texture_2d<f32>;
|
||||
[[binding(7), group(0)]] var tex_out : texture_storage_2d<rgba8unorm, write>;
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
// import_level
|
||||
//
|
||||
// Loads the alpha channel from a texel of the source image, and writes it to
|
||||
// the buf_out.weights.
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn import_level([[builtin(global_invocation_id)]] coord : vec3<u32>) {
|
||||
_ = &buf_in;
|
||||
let offset = coord.x + coord.y * ubo.width;
|
||||
buf_out.weights[offset] = textureLoad(tex_in, vec2<i32>(coord.xy), 0).w;
|
||||
}
|
||||
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
// export_level
|
||||
//
|
||||
// Loads 4 f32 weight values from buf_in.weights, and stores summed value into
|
||||
// buf_out.weights, along with the calculated 'probabilty' vec4 values into the
|
||||
// mip level of tex_out. See simulate() in particle.wgsl to understand the
|
||||
// probability logic.
|
||||
////////////////////////////////////////////////////////////////////////////////
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn export_level([[builtin(global_invocation_id)]] coord : vec3<u32>) {
|
||||
if (all(coord.xy < vec2<u32>(textureDimensions(tex_out)))) {
|
||||
let dst_offset = coord.x + coord.y * ubo.width;
|
||||
let src_offset = coord.x*2u + coord.y*2u * ubo.width;
|
||||
|
||||
let a = buf_in.weights[src_offset + 0u];
|
||||
let b = buf_in.weights[src_offset + 1u];
|
||||
let c = buf_in.weights[src_offset + 0u + ubo.width];
|
||||
let d = buf_in.weights[src_offset + 1u + ubo.width];
|
||||
let sum = dot(vec4<f32>(a, b, c, d), vec4<f32>(1.0));
|
||||
|
||||
buf_out.weights[dst_offset] = sum / 4.0;
|
||||
|
||||
let probabilities = vec4<f32>(a, a+b, a+b+c, sum) / max(sum, 0.0001);
|
||||
textureStore(tex_out, vec2<i32>(coord.xy), probabilities);
|
||||
}
|
||||
}
|
|
@ -0,0 +1,204 @@
|
|||
static float2 rand_seed = float2(0.0f, 0.0f);
|
||||
|
||||
float rand() {
|
||||
rand_seed.x = frac((cos(dot(rand_seed, float2(23.140779495f, 232.616897583f))) * 136.816802979f));
|
||||
rand_seed.y = frac((cos(dot(rand_seed, float2(54.478565216f, 345.841522217f))) * 534.764526367f));
|
||||
return rand_seed.y;
|
||||
}
|
||||
|
||||
cbuffer cbuffer_render_params : register(b0, space0) {
|
||||
uint4 render_params[6];
|
||||
};
|
||||
|
||||
struct VertexInput {
|
||||
float3 position;
|
||||
float4 color;
|
||||
float2 quad_pos;
|
||||
};
|
||||
struct VertexOutput {
|
||||
float4 position;
|
||||
float4 color;
|
||||
float2 quad_pos;
|
||||
};
|
||||
struct tint_symbol_5 {
|
||||
float3 position : TEXCOORD0;
|
||||
float4 color : TEXCOORD1;
|
||||
float2 quad_pos : TEXCOORD2;
|
||||
};
|
||||
struct tint_symbol_6 {
|
||||
float4 color : TEXCOORD0;
|
||||
float2 quad_pos : TEXCOORD1;
|
||||
float4 position : SV_Position;
|
||||
};
|
||||
|
||||
float4x4 tint_symbol_17(uint4 buffer[6], uint offset) {
|
||||
const uint scalar_offset = ((offset + 0u)) / 4;
|
||||
const uint scalar_offset_1 = ((offset + 16u)) / 4;
|
||||
const uint scalar_offset_2 = ((offset + 32u)) / 4;
|
||||
const uint scalar_offset_3 = ((offset + 48u)) / 4;
|
||||
return float4x4(asfloat(buffer[scalar_offset / 4]), asfloat(buffer[scalar_offset_1 / 4]), asfloat(buffer[scalar_offset_2 / 4]), asfloat(buffer[scalar_offset_3 / 4]));
|
||||
}
|
||||
|
||||
VertexOutput vs_main_inner(VertexInput tint_symbol) {
|
||||
float3 quad_pos = mul(tint_symbol.quad_pos, float2x3(asfloat(render_params[4].xyz), asfloat(render_params[5].xyz)));
|
||||
float3 position = (tint_symbol.position + (quad_pos * 0.01f));
|
||||
VertexOutput tint_symbol_1 = (VertexOutput)0;
|
||||
tint_symbol_1.position = mul(float4(position, 1.0f), tint_symbol_17(render_params, 0u));
|
||||
tint_symbol_1.color = tint_symbol.color;
|
||||
tint_symbol_1.quad_pos = tint_symbol.quad_pos;
|
||||
return tint_symbol_1;
|
||||
}
|
||||
|
||||
tint_symbol_6 vs_main(tint_symbol_5 tint_symbol_4) {
|
||||
const VertexInput tint_symbol_32 = {tint_symbol_4.position, tint_symbol_4.color, tint_symbol_4.quad_pos};
|
||||
const VertexOutput inner_result = vs_main_inner(tint_symbol_32);
|
||||
tint_symbol_6 wrapper_result = (tint_symbol_6)0;
|
||||
wrapper_result.position = inner_result.position;
|
||||
wrapper_result.color = inner_result.color;
|
||||
wrapper_result.quad_pos = inner_result.quad_pos;
|
||||
return wrapper_result;
|
||||
}
|
||||
|
||||
struct tint_symbol_8 {
|
||||
float4 color : TEXCOORD0;
|
||||
float2 quad_pos : TEXCOORD1;
|
||||
float4 position : SV_Position;
|
||||
};
|
||||
struct tint_symbol_9 {
|
||||
float4 value : SV_Target0;
|
||||
};
|
||||
|
||||
float4 fs_main_inner(VertexOutput tint_symbol) {
|
||||
float4 color = tint_symbol.color;
|
||||
color.a = (color.a * max((1.0f - length(tint_symbol.quad_pos)), 0.0f));
|
||||
return color;
|
||||
}
|
||||
|
||||
tint_symbol_9 fs_main(tint_symbol_8 tint_symbol_7) {
|
||||
const VertexOutput tint_symbol_33 = {tint_symbol_7.position, tint_symbol_7.color, tint_symbol_7.quad_pos};
|
||||
const float4 inner_result_1 = fs_main_inner(tint_symbol_33);
|
||||
tint_symbol_9 wrapper_result_1 = (tint_symbol_9)0;
|
||||
wrapper_result_1.value = inner_result_1;
|
||||
return wrapper_result_1;
|
||||
}
|
||||
|
||||
struct Particle {
|
||||
float3 position;
|
||||
float lifetime;
|
||||
float4 color;
|
||||
float3 velocity;
|
||||
};
|
||||
|
||||
cbuffer cbuffer_sim_params : register(b0, space0) {
|
||||
uint4 sim_params[2];
|
||||
};
|
||||
RWByteAddressBuffer data : register(u1, space0);
|
||||
Texture2D<float4> tint_symbol_2 : register(t2, space0);
|
||||
|
||||
struct tint_symbol_11 {
|
||||
uint3 GlobalInvocationID : SV_DispatchThreadID;
|
||||
};
|
||||
|
||||
Particle tint_symbol_20(RWByteAddressBuffer buffer, uint offset) {
|
||||
const Particle tint_symbol_34 = {asfloat(buffer.Load3((offset + 0u))), asfloat(buffer.Load((offset + 12u))), asfloat(buffer.Load4((offset + 16u))), asfloat(buffer.Load3((offset + 32u)))};
|
||||
return tint_symbol_34;
|
||||
}
|
||||
|
||||
void tint_symbol_25(RWByteAddressBuffer buffer, uint offset, Particle value) {
|
||||
buffer.Store3((offset + 0u), asuint(value.position));
|
||||
buffer.Store((offset + 12u), asuint(value.lifetime));
|
||||
buffer.Store4((offset + 16u), asuint(value.color));
|
||||
buffer.Store3((offset + 32u), asuint(value.velocity));
|
||||
}
|
||||
|
||||
void simulate_inner(uint3 GlobalInvocationID) {
|
||||
rand_seed = ((asfloat(sim_params[1]).xy + float2(GlobalInvocationID.xy)) * asfloat(sim_params[1]).zw);
|
||||
const uint idx = GlobalInvocationID.x;
|
||||
Particle particle = tint_symbol_20(data, (48u * idx));
|
||||
particle.velocity.z = (particle.velocity.z - (asfloat(sim_params[0].x) * 0.5f));
|
||||
particle.position = (particle.position + (asfloat(sim_params[0].x) * particle.velocity));
|
||||
particle.lifetime = (particle.lifetime - asfloat(sim_params[0].x));
|
||||
particle.color.a = smoothstep(0.0f, 0.5f, particle.lifetime);
|
||||
if ((particle.lifetime < 0.0f)) {
|
||||
int2 coord = int2(0, 0);
|
||||
{
|
||||
int3 tint_tmp;
|
||||
tint_symbol_2.GetDimensions(0, tint_tmp.x, tint_tmp.y, tint_tmp.z);
|
||||
int level = (tint_tmp.z - 1);
|
||||
[loop] for(; (level > 0); level = (level - 1)) {
|
||||
const float4 probabilites = tint_symbol_2.Load(int3(coord, level));
|
||||
const float4 value = float4((rand()).xxxx);
|
||||
const bool4 mask = ((value >= float4(0.0f, probabilites.xyz)) & (value < probabilites));
|
||||
coord = (coord * 2);
|
||||
coord.x = (coord.x + (any(mask.yw) ? 1 : 0));
|
||||
coord.y = (coord.y + (any(mask.zw) ? 1 : 0));
|
||||
}
|
||||
}
|
||||
int2 tint_tmp_1;
|
||||
tint_symbol_2.GetDimensions(tint_tmp_1.x, tint_tmp_1.y);
|
||||
const float2 uv = (float2(coord) / float2(tint_tmp_1));
|
||||
particle.position = float3((((uv - 0.5f) * 3.0f) * float2(1.0f, -1.0f)), 0.0f);
|
||||
particle.color = tint_symbol_2.Load(int3(coord, 0));
|
||||
particle.velocity.x = ((rand() - 0.5f) * 0.100000001f);
|
||||
particle.velocity.y = ((rand() - 0.5f) * 0.100000001f);
|
||||
particle.velocity.z = (rand() * 0.300000012f);
|
||||
particle.lifetime = (0.5f + (rand() * 2.0f));
|
||||
}
|
||||
tint_symbol_25(data, (48u * idx), particle);
|
||||
}
|
||||
|
||||
[numthreads(64, 1, 1)]
|
||||
void simulate(tint_symbol_11 tint_symbol_10) {
|
||||
simulate_inner(tint_symbol_10.GlobalInvocationID);
|
||||
return;
|
||||
}
|
||||
|
||||
cbuffer cbuffer_ubo : register(b3, space0) {
|
||||
uint4 ubo[1];
|
||||
};
|
||||
ByteAddressBuffer buf_in : register(t4, space0);
|
||||
RWByteAddressBuffer buf_out : register(u5, space0);
|
||||
Texture2D<float4> tex_in : register(t6, space0);
|
||||
RWTexture2D<float4> tex_out : register(u7, space0);
|
||||
|
||||
struct tint_symbol_13 {
|
||||
uint3 coord : SV_DispatchThreadID;
|
||||
};
|
||||
|
||||
void import_level_inner(uint3 coord) {
|
||||
const uint offset = (coord.x + (coord.y * ubo[0].x));
|
||||
buf_out.Store((4u * offset), asuint(tex_in.Load(int3(int2(coord.xy), 0)).w));
|
||||
}
|
||||
|
||||
[numthreads(64, 1, 1)]
|
||||
void import_level(tint_symbol_13 tint_symbol_12) {
|
||||
import_level_inner(tint_symbol_12.coord);
|
||||
return;
|
||||
}
|
||||
|
||||
struct tint_symbol_15 {
|
||||
uint3 coord : SV_DispatchThreadID;
|
||||
};
|
||||
|
||||
void export_level_inner(uint3 coord) {
|
||||
int2 tint_tmp_2;
|
||||
tex_out.GetDimensions(tint_tmp_2.x, tint_tmp_2.y);
|
||||
if (all((coord.xy < uint2(tint_tmp_2)))) {
|
||||
const uint dst_offset = (coord.x + (coord.y * ubo[0].x));
|
||||
const uint src_offset = ((coord.x * 2u) + ((coord.y * 2u) * ubo[0].x));
|
||||
const float a_1 = asfloat(buf_in.Load((4u * (src_offset + 0u))));
|
||||
const float b = asfloat(buf_in.Load((4u * (src_offset + 1u))));
|
||||
const float c = asfloat(buf_in.Load((4u * ((src_offset + 0u) + ubo[0].x))));
|
||||
const float d = asfloat(buf_in.Load((4u * ((src_offset + 1u) + ubo[0].x))));
|
||||
const float sum = dot(float4(a_1, b, c, d), float4((1.0f).xxxx));
|
||||
buf_out.Store((4u * dst_offset), asuint((sum / 4.0f)));
|
||||
const float4 probabilities = (float4(a_1, (a_1 + b), ((a_1 + b) + c), sum) / max(sum, 0.0001f));
|
||||
tex_out[int2(coord.xy)] = probabilities;
|
||||
}
|
||||
}
|
||||
|
||||
[numthreads(64, 1, 1)]
|
||||
void export_level(tint_symbol_15 tint_symbol_14) {
|
||||
export_level_inner(tint_symbol_14.coord);
|
||||
return;
|
||||
}
|
|
@ -0,0 +1,175 @@
|
|||
#include <metal_stdlib>
|
||||
|
||||
using namespace metal;
|
||||
|
||||
template<typename T, int N, int M>
|
||||
inline vec<T, M> operator*(matrix<T, N, M> lhs, packed_vec<T, N> rhs) {
|
||||
return lhs * vec<T, N>(rhs);
|
||||
}
|
||||
|
||||
template<typename T, int N, int M>
|
||||
inline vec<T, N> operator*(packed_vec<T, M> lhs, matrix<T, N, M> rhs) {
|
||||
return vec<T, M>(lhs) * rhs;
|
||||
}
|
||||
|
||||
struct RenderParams {
|
||||
/* 0x0000 */ float4x4 modelViewProjectionMatrix;
|
||||
/* 0x0040 */ packed_float3 right;
|
||||
/* 0x004c */ int8_t tint_pad[4];
|
||||
/* 0x0050 */ packed_float3 up;
|
||||
/* 0x005c */ int8_t tint_pad_1[4];
|
||||
};
|
||||
struct VertexInput {
|
||||
float3 position;
|
||||
float4 color;
|
||||
float2 quad_pos;
|
||||
};
|
||||
struct VertexOutput {
|
||||
float4 position;
|
||||
float4 color;
|
||||
float2 quad_pos;
|
||||
};
|
||||
struct tint_symbol_2 {
|
||||
float3 position [[attribute(0)]];
|
||||
float4 color [[attribute(1)]];
|
||||
float2 quad_pos [[attribute(2)]];
|
||||
};
|
||||
struct tint_symbol_3 {
|
||||
float4 color [[user(locn0)]];
|
||||
float2 quad_pos [[user(locn1)]];
|
||||
float4 position [[position]];
|
||||
};
|
||||
struct tint_symbol_5 {
|
||||
float4 color [[user(locn0)]];
|
||||
float2 quad_pos [[user(locn1)]];
|
||||
};
|
||||
struct tint_symbol_6 {
|
||||
float4 value [[color(0)]];
|
||||
};
|
||||
struct SimulationParams {
|
||||
/* 0x0000 */ float deltaTime;
|
||||
/* 0x0004 */ int8_t tint_pad_2[12];
|
||||
/* 0x0010 */ float4 seed;
|
||||
};
|
||||
struct Particle {
|
||||
/* 0x0000 */ packed_float3 position;
|
||||
/* 0x000c */ float lifetime;
|
||||
/* 0x0010 */ float4 color;
|
||||
/* 0x0020 */ packed_float3 velocity;
|
||||
/* 0x002c */ int8_t tint_pad_3[4];
|
||||
};
|
||||
struct Particles {
|
||||
/* 0x0000 */ Particle particles[1];
|
||||
};
|
||||
struct UBO {
|
||||
/* 0x0000 */ uint width;
|
||||
};
|
||||
struct Buffer {
|
||||
/* 0x0000 */ float weights[1];
|
||||
};
|
||||
|
||||
float rand(thread float2* const tint_symbol_9) {
|
||||
(*(tint_symbol_9))[0] = fract((cos(dot(*(tint_symbol_9), float2(23.140779495f, 232.616897583f))) * 136.816802979f));
|
||||
(*(tint_symbol_9))[1] = fract((cos(dot(*(tint_symbol_9), float2(54.478565216f, 345.841522217f))) * 534.764526367f));
|
||||
return (*(tint_symbol_9))[1];
|
||||
}
|
||||
|
||||
VertexOutput vs_main_inner(VertexInput in, const constant RenderParams* const tint_symbol_10) {
|
||||
float3 quad_pos = (float2x3((*(tint_symbol_10)).right, (*(tint_symbol_10)).up) * in.quad_pos);
|
||||
float3 position = (in.position + (quad_pos * 0.01f));
|
||||
VertexOutput out = {};
|
||||
out.position = ((*(tint_symbol_10)).modelViewProjectionMatrix * float4(position, 1.0f));
|
||||
out.color = in.color;
|
||||
out.quad_pos = in.quad_pos;
|
||||
return out;
|
||||
}
|
||||
|
||||
vertex tint_symbol_3 vs_main(const constant RenderParams* tint_symbol_11 [[buffer(0)]], tint_symbol_2 tint_symbol_1 [[stage_in]]) {
|
||||
VertexInput const tint_symbol_7 = {.position=tint_symbol_1.position, .color=tint_symbol_1.color, .quad_pos=tint_symbol_1.quad_pos};
|
||||
VertexOutput const inner_result = vs_main_inner(tint_symbol_7, tint_symbol_11);
|
||||
tint_symbol_3 wrapper_result = {};
|
||||
wrapper_result.position = inner_result.position;
|
||||
wrapper_result.color = inner_result.color;
|
||||
wrapper_result.quad_pos = inner_result.quad_pos;
|
||||
return wrapper_result;
|
||||
}
|
||||
|
||||
float4 fs_main_inner(VertexOutput in) {
|
||||
float4 color = in.color;
|
||||
color[3] = (color[3] * fmax((1.0f - length(in.quad_pos)), 0.0f));
|
||||
return color;
|
||||
}
|
||||
|
||||
fragment tint_symbol_6 fs_main(float4 position [[position]], tint_symbol_5 tint_symbol_4 [[stage_in]]) {
|
||||
VertexOutput const tint_symbol_8 = {.position=position, .color=tint_symbol_4.color, .quad_pos=tint_symbol_4.quad_pos};
|
||||
float4 const inner_result_1 = fs_main_inner(tint_symbol_8);
|
||||
tint_symbol_6 wrapper_result_1 = {};
|
||||
wrapper_result_1.value = inner_result_1;
|
||||
return wrapper_result_1;
|
||||
}
|
||||
|
||||
void simulate_inner(uint3 GlobalInvocationID, thread float2* const tint_symbol_12, const constant SimulationParams* const tint_symbol_13, device Particles* const tint_symbol_14, texture2d<float, access::sample> tint_symbol_15) {
|
||||
*(tint_symbol_12) = ((float4((*(tint_symbol_13)).seed).xy + float2(uint3(GlobalInvocationID).xy)) * float4((*(tint_symbol_13)).seed).zw);
|
||||
uint const idx = GlobalInvocationID[0];
|
||||
Particle particle = (*(tint_symbol_14)).particles[idx];
|
||||
particle.velocity[2] = (particle.velocity[2] - ((*(tint_symbol_13)).deltaTime * 0.5f));
|
||||
particle.position = (particle.position + ((*(tint_symbol_13)).deltaTime * particle.velocity));
|
||||
particle.lifetime = (particle.lifetime - (*(tint_symbol_13)).deltaTime);
|
||||
particle.color[3] = smoothstep(0.0f, 0.5f, particle.lifetime);
|
||||
if ((particle.lifetime < 0.0f)) {
|
||||
int2 coord = int2(0, 0);
|
||||
for(int level = as_type<int>((as_type<uint>(int(tint_symbol_15.get_num_mip_levels())) - as_type<uint>(1))); (level > 0); level = as_type<int>((as_type<uint>(level) - as_type<uint>(1)))) {
|
||||
float4 const probabilites = tint_symbol_15.read(uint2(coord), level);
|
||||
float4 const value = float4(rand(tint_symbol_12));
|
||||
bool4 const mask = ((value >= float4(0.0f, float4(probabilites).xyz)) & (value < probabilites));
|
||||
coord = as_type<int2>((as_type<uint2>(coord) * as_type<uint>(2)));
|
||||
coord[0] = as_type<int>((as_type<uint>(coord[0]) + as_type<uint>(select(0, 1, any(bool4(mask).yw)))));
|
||||
coord[1] = as_type<int>((as_type<uint>(coord[1]) + as_type<uint>(select(0, 1, any(bool4(mask).zw)))));
|
||||
}
|
||||
float2 const uv = (float2(coord) / float2(int2(tint_symbol_15.get_width(), tint_symbol_15.get_height())));
|
||||
particle.position = float3((((uv - 0.5f) * 3.0f) * float2(1.0f, -1.0f)), 0.0f);
|
||||
particle.color = tint_symbol_15.read(uint2(coord), 0);
|
||||
particle.velocity[0] = ((rand(tint_symbol_12) - 0.5f) * 0.100000001f);
|
||||
particle.velocity[1] = ((rand(tint_symbol_12) - 0.5f) * 0.100000001f);
|
||||
particle.velocity[2] = (rand(tint_symbol_12) * 0.300000012f);
|
||||
particle.lifetime = (0.5f + (rand(tint_symbol_12) * 2.0f));
|
||||
}
|
||||
(*(tint_symbol_14)).particles[idx] = particle;
|
||||
}
|
||||
|
||||
kernel void simulate(const constant SimulationParams* tint_symbol_17 [[buffer(0)]], device Particles* tint_symbol_18 [[buffer(1)]], texture2d<float, access::sample> tint_symbol_19 [[texture(0)]], uint3 GlobalInvocationID [[thread_position_in_grid]]) {
|
||||
thread float2 tint_symbol_16 = 0.0f;
|
||||
simulate_inner(GlobalInvocationID, &(tint_symbol_16), tint_symbol_17, tint_symbol_18, tint_symbol_19);
|
||||
return;
|
||||
}
|
||||
|
||||
void import_level_inner(uint3 coord, const constant UBO* const tint_symbol_20, device Buffer* const tint_symbol_21, texture2d<float, access::sample> tint_symbol_22) {
|
||||
uint const offset = (coord[0] + (coord[1] * (*(tint_symbol_20)).width));
|
||||
(*(tint_symbol_21)).weights[offset] = tint_symbol_22.read(uint2(int2(uint3(coord).xy)), 0)[3];
|
||||
}
|
||||
|
||||
kernel void import_level(const constant UBO* tint_symbol_23 [[buffer(2)]], device Buffer* tint_symbol_24 [[buffer(3)]], texture2d<float, access::sample> tint_symbol_25 [[texture(1)]], uint3 coord [[thread_position_in_grid]]) {
|
||||
import_level_inner(coord, tint_symbol_23, tint_symbol_24, tint_symbol_25);
|
||||
return;
|
||||
}
|
||||
|
||||
void export_level_inner(uint3 coord, texture2d<float, access::write> tint_symbol_26, const constant UBO* const tint_symbol_27, const device Buffer* const tint_symbol_28, device Buffer* const tint_symbol_29) {
|
||||
if (all((uint3(coord).xy < uint2(int2(tint_symbol_26.get_width(), tint_symbol_26.get_height()))))) {
|
||||
uint const dst_offset = (coord[0] + (coord[1] * (*(tint_symbol_27)).width));
|
||||
uint const src_offset = ((coord[0] * 2u) + ((coord[1] * 2u) * (*(tint_symbol_27)).width));
|
||||
float const a_1 = (*(tint_symbol_28)).weights[(src_offset + 0u)];
|
||||
float const b = (*(tint_symbol_28)).weights[(src_offset + 1u)];
|
||||
float const c = (*(tint_symbol_28)).weights[((src_offset + 0u) + (*(tint_symbol_27)).width)];
|
||||
float const d = (*(tint_symbol_28)).weights[((src_offset + 1u) + (*(tint_symbol_27)).width)];
|
||||
float const sum = dot(float4(a_1, b, c, d), float4(1.0f));
|
||||
(*(tint_symbol_29)).weights[dst_offset] = (sum / 4.0f);
|
||||
float4 const probabilities = (float4(a_1, (a_1 + b), ((a_1 + b) + c), sum) / fmax(sum, 0.0001f));
|
||||
tint_symbol_26.write(probabilities, uint2(int2(uint3(coord).xy)));
|
||||
}
|
||||
}
|
||||
|
||||
kernel void export_level(texture2d<float, access::write> tint_symbol_30 [[texture(2)]], const constant UBO* tint_symbol_31 [[buffer(2)]], const device Buffer* tint_symbol_32 [[buffer(4)]], device Buffer* tint_symbol_33 [[buffer(3)]], uint3 coord [[thread_position_in_grid]]) {
|
||||
export_level_inner(coord, tint_symbol_30, tint_symbol_31, tint_symbol_32, tint_symbol_33);
|
||||
return;
|
||||
}
|
||||
|
|
@ -0,0 +1,646 @@
|
|||
; SPIR-V
|
||||
; Version: 1.3
|
||||
; Generator: Google Tint Compiler; 0
|
||||
; Bound: 423
|
||||
; Schema: 0
|
||||
OpCapability Shader
|
||||
OpCapability ImageQuery
|
||||
%67 = OpExtInstImport "GLSL.std.450"
|
||||
OpMemoryModel Logical GLSL450
|
||||
OpEntryPoint Vertex %vs_main "vs_main" %position_1 %color_1 %quad_pos_1 %position_2 %color_2 %quad_pos_2 %vertex_point_size
|
||||
OpEntryPoint Fragment %fs_main "fs_main" %position_3 %color_3 %quad_pos_3 %value_1
|
||||
OpEntryPoint GLCompute %simulate "simulate" %GlobalInvocationID_1
|
||||
OpEntryPoint GLCompute %import_level "import_level" %coord_1
|
||||
OpEntryPoint GLCompute %export_level "export_level" %coord_2
|
||||
OpExecutionMode %fs_main OriginUpperLeft
|
||||
OpExecutionMode %simulate LocalSize 64 1 1
|
||||
OpExecutionMode %import_level LocalSize 64 1 1
|
||||
OpExecutionMode %export_level LocalSize 64 1 1
|
||||
OpName %position_1 "position_1"
|
||||
OpName %color_1 "color_1"
|
||||
OpName %quad_pos_1 "quad_pos_1"
|
||||
OpName %position_2 "position_2"
|
||||
OpName %color_2 "color_2"
|
||||
OpName %quad_pos_2 "quad_pos_2"
|
||||
OpName %vertex_point_size "vertex_point_size"
|
||||
OpName %position_3 "position_3"
|
||||
OpName %color_3 "color_3"
|
||||
OpName %quad_pos_3 "quad_pos_3"
|
||||
OpName %value_1 "value_1"
|
||||
OpName %GlobalInvocationID_1 "GlobalInvocationID_1"
|
||||
OpName %coord_1 "coord_1"
|
||||
OpName %coord_2 "coord_2"
|
||||
OpName %rand_seed "rand_seed"
|
||||
OpName %RenderParams "RenderParams"
|
||||
OpMemberName %RenderParams 0 "modelViewProjectionMatrix"
|
||||
OpMemberName %RenderParams 1 "right"
|
||||
OpMemberName %RenderParams 2 "up"
|
||||
OpName %render_params "render_params"
|
||||
OpName %SimulationParams "SimulationParams"
|
||||
OpMemberName %SimulationParams 0 "deltaTime"
|
||||
OpMemberName %SimulationParams 1 "seed"
|
||||
OpName %sim_params "sim_params"
|
||||
OpName %Particles "Particles"
|
||||
OpMemberName %Particles 0 "particles"
|
||||
OpName %Particle "Particle"
|
||||
OpMemberName %Particle 0 "position"
|
||||
OpMemberName %Particle 1 "lifetime"
|
||||
OpMemberName %Particle 2 "color"
|
||||
OpMemberName %Particle 3 "velocity"
|
||||
OpName %data "data"
|
||||
OpName %texture "texture"
|
||||
OpName %UBO "UBO"
|
||||
OpMemberName %UBO 0 "width"
|
||||
OpName %ubo "ubo"
|
||||
OpName %Buffer "Buffer"
|
||||
OpMemberName %Buffer 0 "weights"
|
||||
OpName %buf_in "buf_in"
|
||||
OpName %buf_out "buf_out"
|
||||
OpName %tex_in "tex_in"
|
||||
OpName %tex_out "tex_out"
|
||||
OpName %rand "rand"
|
||||
OpName %VertexOutput "VertexOutput"
|
||||
OpMemberName %VertexOutput 0 "position"
|
||||
OpMemberName %VertexOutput 1 "color"
|
||||
OpMemberName %VertexOutput 2 "quad_pos"
|
||||
OpName %VertexInput "VertexInput"
|
||||
OpMemberName %VertexInput 0 "position"
|
||||
OpMemberName %VertexInput 1 "color"
|
||||
OpMemberName %VertexInput 2 "quad_pos"
|
||||
OpName %vs_main_inner "vs_main_inner"
|
||||
OpName %in "in"
|
||||
OpName %quad_pos "quad_pos"
|
||||
OpName %position "position"
|
||||
OpName %out "out"
|
||||
OpName %vs_main "vs_main"
|
||||
OpName %fs_main_inner "fs_main_inner"
|
||||
OpName %in_0 "in"
|
||||
OpName %color "color"
|
||||
OpName %fs_main "fs_main"
|
||||
OpName %simulate_inner "simulate_inner"
|
||||
OpName %GlobalInvocationID "GlobalInvocationID"
|
||||
OpName %particle "particle"
|
||||
OpName %coord "coord"
|
||||
OpName %level "level"
|
||||
OpName %simulate "simulate"
|
||||
OpName %import_level_inner "import_level_inner"
|
||||
OpName %coord_0 "coord"
|
||||
OpName %import_level "import_level"
|
||||
OpName %export_level_inner "export_level_inner"
|
||||
OpName %coord_3 "coord"
|
||||
OpName %export_level "export_level"
|
||||
OpDecorate %position_1 Location 0
|
||||
OpDecorate %color_1 Location 1
|
||||
OpDecorate %quad_pos_1 Location 2
|
||||
OpDecorate %position_2 BuiltIn Position
|
||||
OpDecorate %color_2 Location 0
|
||||
OpDecorate %quad_pos_2 Location 1
|
||||
OpDecorate %vertex_point_size BuiltIn PointSize
|
||||
OpDecorate %position_3 BuiltIn FragCoord
|
||||
OpDecorate %color_3 Location 0
|
||||
OpDecorate %quad_pos_3 Location 1
|
||||
OpDecorate %value_1 Location 0
|
||||
OpDecorate %GlobalInvocationID_1 BuiltIn GlobalInvocationId
|
||||
OpDecorate %coord_1 BuiltIn GlobalInvocationId
|
||||
OpDecorate %coord_2 BuiltIn GlobalInvocationId
|
||||
OpDecorate %RenderParams Block
|
||||
OpMemberDecorate %RenderParams 0 Offset 0
|
||||
OpMemberDecorate %RenderParams 0 ColMajor
|
||||
OpMemberDecorate %RenderParams 0 MatrixStride 16
|
||||
OpMemberDecorate %RenderParams 1 Offset 64
|
||||
OpMemberDecorate %RenderParams 2 Offset 80
|
||||
OpDecorate %render_params NonWritable
|
||||
OpDecorate %render_params Binding 0
|
||||
OpDecorate %render_params DescriptorSet 0
|
||||
OpDecorate %SimulationParams Block
|
||||
OpMemberDecorate %SimulationParams 0 Offset 0
|
||||
OpMemberDecorate %SimulationParams 1 Offset 16
|
||||
OpDecorate %sim_params NonWritable
|
||||
OpDecorate %sim_params Binding 0
|
||||
OpDecorate %sim_params DescriptorSet 0
|
||||
OpDecorate %Particles Block
|
||||
OpMemberDecorate %Particles 0 Offset 0
|
||||
OpMemberDecorate %Particle 0 Offset 0
|
||||
OpMemberDecorate %Particle 1 Offset 12
|
||||
OpMemberDecorate %Particle 2 Offset 16
|
||||
OpMemberDecorate %Particle 3 Offset 32
|
||||
OpDecorate %_runtimearr_Particle ArrayStride 48
|
||||
OpDecorate %data Binding 1
|
||||
OpDecorate %data DescriptorSet 0
|
||||
OpDecorate %texture Binding 2
|
||||
OpDecorate %texture DescriptorSet 0
|
||||
OpDecorate %UBO Block
|
||||
OpMemberDecorate %UBO 0 Offset 0
|
||||
OpDecorate %ubo NonWritable
|
||||
OpDecorate %ubo Binding 3
|
||||
OpDecorate %ubo DescriptorSet 0
|
||||
OpDecorate %Buffer Block
|
||||
OpMemberDecorate %Buffer 0 Offset 0
|
||||
OpDecorate %_runtimearr_float ArrayStride 4
|
||||
OpDecorate %buf_in NonWritable
|
||||
OpDecorate %buf_in Binding 4
|
||||
OpDecorate %buf_in DescriptorSet 0
|
||||
OpDecorate %buf_out Binding 5
|
||||
OpDecorate %buf_out DescriptorSet 0
|
||||
OpDecorate %tex_in Binding 6
|
||||
OpDecorate %tex_in DescriptorSet 0
|
||||
OpDecorate %tex_out NonReadable
|
||||
OpDecorate %tex_out Binding 7
|
||||
OpDecorate %tex_out DescriptorSet 0
|
||||
OpMemberDecorate %VertexOutput 0 Offset 0
|
||||
OpMemberDecorate %VertexOutput 1 Offset 16
|
||||
OpMemberDecorate %VertexOutput 2 Offset 32
|
||||
OpMemberDecorate %VertexInput 0 Offset 0
|
||||
OpMemberDecorate %VertexInput 1 Offset 16
|
||||
OpMemberDecorate %VertexInput 2 Offset 32
|
||||
%float = OpTypeFloat 32
|
||||
%v3float = OpTypeVector %float 3
|
||||
%_ptr_Input_v3float = OpTypePointer Input %v3float
|
||||
%position_1 = OpVariable %_ptr_Input_v3float Input
|
||||
%v4float = OpTypeVector %float 4
|
||||
%_ptr_Input_v4float = OpTypePointer Input %v4float
|
||||
%color_1 = OpVariable %_ptr_Input_v4float Input
|
||||
%v2float = OpTypeVector %float 2
|
||||
%_ptr_Input_v2float = OpTypePointer Input %v2float
|
||||
%quad_pos_1 = OpVariable %_ptr_Input_v2float Input
|
||||
%_ptr_Output_v4float = OpTypePointer Output %v4float
|
||||
%13 = OpConstantNull %v4float
|
||||
%position_2 = OpVariable %_ptr_Output_v4float Output %13
|
||||
%color_2 = OpVariable %_ptr_Output_v4float Output %13
|
||||
%_ptr_Output_v2float = OpTypePointer Output %v2float
|
||||
%17 = OpConstantNull %v2float
|
||||
%quad_pos_2 = OpVariable %_ptr_Output_v2float Output %17
|
||||
%_ptr_Output_float = OpTypePointer Output %float
|
||||
%20 = OpConstantNull %float
|
||||
%vertex_point_size = OpVariable %_ptr_Output_float Output %20
|
||||
%position_3 = OpVariable %_ptr_Input_v4float Input
|
||||
%color_3 = OpVariable %_ptr_Input_v4float Input
|
||||
%quad_pos_3 = OpVariable %_ptr_Input_v2float Input
|
||||
%value_1 = OpVariable %_ptr_Output_v4float Output %13
|
||||
%uint = OpTypeInt 32 0
|
||||
%v3uint = OpTypeVector %uint 3
|
||||
%_ptr_Input_v3uint = OpTypePointer Input %v3uint
|
||||
%GlobalInvocationID_1 = OpVariable %_ptr_Input_v3uint Input
|
||||
%coord_1 = OpVariable %_ptr_Input_v3uint Input
|
||||
%coord_2 = OpVariable %_ptr_Input_v3uint Input
|
||||
%_ptr_Private_v2float = OpTypePointer Private %v2float
|
||||
%rand_seed = OpVariable %_ptr_Private_v2float Private %17
|
||||
%mat4v4float = OpTypeMatrix %v4float 4
|
||||
%RenderParams = OpTypeStruct %mat4v4float %v3float %v3float
|
||||
%_ptr_Uniform_RenderParams = OpTypePointer Uniform %RenderParams
|
||||
%render_params = OpVariable %_ptr_Uniform_RenderParams Uniform
|
||||
%SimulationParams = OpTypeStruct %float %v4float
|
||||
%_ptr_Uniform_SimulationParams = OpTypePointer Uniform %SimulationParams
|
||||
%sim_params = OpVariable %_ptr_Uniform_SimulationParams Uniform
|
||||
%Particle = OpTypeStruct %v3float %float %v4float %v3float
|
||||
%_runtimearr_Particle = OpTypeRuntimeArray %Particle
|
||||
%Particles = OpTypeStruct %_runtimearr_Particle
|
||||
%_ptr_StorageBuffer_Particles = OpTypePointer StorageBuffer %Particles
|
||||
%data = OpVariable %_ptr_StorageBuffer_Particles StorageBuffer
|
||||
%47 = OpTypeImage %float 2D 0 0 0 1 Unknown
|
||||
%_ptr_UniformConstant_47 = OpTypePointer UniformConstant %47
|
||||
%texture = OpVariable %_ptr_UniformConstant_47 UniformConstant
|
||||
%UBO = OpTypeStruct %uint
|
||||
%_ptr_Uniform_UBO = OpTypePointer Uniform %UBO
|
||||
%ubo = OpVariable %_ptr_Uniform_UBO Uniform
|
||||
%_runtimearr_float = OpTypeRuntimeArray %float
|
||||
%Buffer = OpTypeStruct %_runtimearr_float
|
||||
%_ptr_StorageBuffer_Buffer = OpTypePointer StorageBuffer %Buffer
|
||||
%buf_in = OpVariable %_ptr_StorageBuffer_Buffer StorageBuffer
|
||||
%buf_out = OpVariable %_ptr_StorageBuffer_Buffer StorageBuffer
|
||||
%tex_in = OpVariable %_ptr_UniformConstant_47 UniformConstant
|
||||
%59 = OpTypeImage %float 2D 0 0 0 2 Rgba8
|
||||
%_ptr_UniformConstant_59 = OpTypePointer UniformConstant %59
|
||||
%tex_out = OpVariable %_ptr_UniformConstant_59 UniformConstant
|
||||
%60 = OpTypeFunction %float
|
||||
%uint_0 = OpConstant %uint 0
|
||||
%_ptr_Private_float = OpTypePointer Private %float
|
||||
%float_23_1407795 = OpConstant %float 23.1407795
|
||||
%float_232_616898 = OpConstant %float 232.616898
|
||||
%73 = OpConstantComposite %v2float %float_23_1407795 %float_232_616898
|
||||
%float_136_816803 = OpConstant %float 136.816803
|
||||
%uint_1 = OpConstant %uint 1
|
||||
%float_54_4785652 = OpConstant %float 54.4785652
|
||||
%float_345_841522 = OpConstant %float 345.841522
|
||||
%84 = OpConstantComposite %v2float %float_54_4785652 %float_345_841522
|
||||
%float_534_764526 = OpConstant %float 534.764526
|
||||
%VertexOutput = OpTypeStruct %v4float %v4float %v2float
|
||||
%VertexInput = OpTypeStruct %v3float %v4float %v2float
|
||||
%89 = OpTypeFunction %VertexOutput %VertexInput
|
||||
%mat2v3float = OpTypeMatrix %v3float 2
|
||||
%_ptr_Uniform_v3float = OpTypePointer Uniform %v3float
|
||||
%uint_2 = OpConstant %uint 2
|
||||
%_ptr_Function_v3float = OpTypePointer Function %v3float
|
||||
%107 = OpConstantNull %v3float
|
||||
%float_0_00999999978 = OpConstant %float 0.00999999978
|
||||
%_ptr_Function_VertexOutput = OpTypePointer Function %VertexOutput
|
||||
%116 = OpConstantNull %VertexOutput
|
||||
%_ptr_Function_v4float = OpTypePointer Function %v4float
|
||||
%_ptr_Uniform_mat4v4float = OpTypePointer Uniform %mat4v4float
|
||||
%float_1 = OpConstant %float 1
|
||||
%_ptr_Function_v2float = OpTypePointer Function %v2float
|
||||
%void = OpTypeVoid
|
||||
%135 = OpTypeFunction %void
|
||||
%147 = OpTypeFunction %v4float %VertexOutput
|
||||
%uint_3 = OpConstant %uint 3
|
||||
%_ptr_Function_float = OpTypePointer Function %float
|
||||
%float_0 = OpConstant %float 0
|
||||
%172 = OpTypeFunction %void %v3uint
|
||||
%_ptr_Uniform_v4float = OpTypePointer Uniform %v4float
|
||||
%v2uint = OpTypeVector %uint 2
|
||||
%_ptr_StorageBuffer_Particle = OpTypePointer StorageBuffer %Particle
|
||||
%_ptr_Function_Particle = OpTypePointer Function %Particle
|
||||
%194 = OpConstantNull %Particle
|
||||
%_ptr_Uniform_float = OpTypePointer Uniform %float
|
||||
%float_0_5 = OpConstant %float 0.5
|
||||
%bool = OpTypeBool
|
||||
%int = OpTypeInt 32 1
|
||||
%v2int = OpTypeVector %int 2
|
||||
%int_0 = OpConstant %int 0
|
||||
%232 = OpConstantComposite %v2int %int_0 %int_0
|
||||
%_ptr_Function_v2int = OpTypePointer Function %v2int
|
||||
%235 = OpConstantNull %v2int
|
||||
%int_1 = OpConstant %int 1
|
||||
%_ptr_Function_int = OpTypePointer Function %int
|
||||
%242 = OpConstantNull %int
|
||||
%v4bool = OpTypeVector %bool 4
|
||||
%int_2 = OpConstant %int 2
|
||||
%v2bool = OpTypeVector %bool 2
|
||||
%float_3 = OpConstant %float 3
|
||||
%float_n1 = OpConstant %float -1
|
||||
%302 = OpConstantComposite %v2float %float_1 %float_n1
|
||||
%float_0_100000001 = OpConstant %float 0.100000001
|
||||
%float_0_300000012 = OpConstant %float 0.300000012
|
||||
%float_2 = OpConstant %float 2
|
||||
%_ptr_Uniform_uint = OpTypePointer Uniform %uint
|
||||
%_ptr_StorageBuffer_float = OpTypePointer StorageBuffer %float
|
||||
%402 = OpConstantComposite %v4float %float_1 %float_1 %float_1 %float_1
|
||||
%float_4 = OpConstant %float 4
|
||||
%float_9_99999975en05 = OpConstant %float 9.99999975e-05
|
||||
%rand = OpFunction %float None %60
|
||||
%62 = OpLabel
|
||||
%65 = OpAccessChain %_ptr_Private_float %rand_seed %uint_0
|
||||
%70 = OpLoad %v2float %rand_seed
|
||||
%69 = OpDot %float %70 %73
|
||||
%68 = OpExtInst %float %67 Cos %69
|
||||
%75 = OpFMul %float %68 %float_136_816803
|
||||
%66 = OpExtInst %float %67 Fract %75
|
||||
OpStore %65 %66
|
||||
%77 = OpAccessChain %_ptr_Private_float %rand_seed %uint_1
|
||||
%81 = OpLoad %v2float %rand_seed
|
||||
%80 = OpDot %float %81 %84
|
||||
%79 = OpExtInst %float %67 Cos %80
|
||||
%86 = OpFMul %float %79 %float_534_764526
|
||||
%78 = OpExtInst %float %67 Fract %86
|
||||
OpStore %77 %78
|
||||
%87 = OpAccessChain %_ptr_Private_float %rand_seed %uint_1
|
||||
%88 = OpLoad %float %87
|
||||
OpReturnValue %88
|
||||
OpFunctionEnd
|
||||
%vs_main_inner = OpFunction %VertexOutput None %89
|
||||
%in = OpFunctionParameter %VertexInput
|
||||
%94 = OpLabel
|
||||
%quad_pos = OpVariable %_ptr_Function_v3float Function %107
|
||||
%position = OpVariable %_ptr_Function_v3float Function %107
|
||||
%out = OpVariable %_ptr_Function_VertexOutput Function %116
|
||||
%97 = OpAccessChain %_ptr_Uniform_v3float %render_params %uint_1
|
||||
%98 = OpLoad %v3float %97
|
||||
%100 = OpAccessChain %_ptr_Uniform_v3float %render_params %uint_2
|
||||
%101 = OpLoad %v3float %100
|
||||
%102 = OpCompositeConstruct %mat2v3float %98 %101
|
||||
%103 = OpCompositeExtract %v2float %in 2
|
||||
%104 = OpMatrixTimesVector %v3float %102 %103
|
||||
OpStore %quad_pos %104
|
||||
%108 = OpCompositeExtract %v3float %in 0
|
||||
%109 = OpLoad %v3float %quad_pos
|
||||
%111 = OpVectorTimesScalar %v3float %109 %float_0_00999999978
|
||||
%112 = OpFAdd %v3float %108 %111
|
||||
OpStore %position %112
|
||||
%118 = OpAccessChain %_ptr_Function_v4float %out %uint_0
|
||||
%120 = OpAccessChain %_ptr_Uniform_mat4v4float %render_params %uint_0
|
||||
%121 = OpLoad %mat4v4float %120
|
||||
%122 = OpLoad %v3float %position
|
||||
%123 = OpCompositeExtract %float %122 0
|
||||
%124 = OpCompositeExtract %float %122 1
|
||||
%125 = OpCompositeExtract %float %122 2
|
||||
%127 = OpCompositeConstruct %v4float %123 %124 %125 %float_1
|
||||
%128 = OpMatrixTimesVector %v4float %121 %127
|
||||
OpStore %118 %128
|
||||
%129 = OpAccessChain %_ptr_Function_v4float %out %uint_1
|
||||
%130 = OpCompositeExtract %v4float %in 1
|
||||
OpStore %129 %130
|
||||
%132 = OpAccessChain %_ptr_Function_v2float %out %uint_2
|
||||
%133 = OpCompositeExtract %v2float %in 2
|
||||
OpStore %132 %133
|
||||
%134 = OpLoad %VertexOutput %out
|
||||
OpReturnValue %134
|
||||
OpFunctionEnd
|
||||
%vs_main = OpFunction %void None %135
|
||||
%138 = OpLabel
|
||||
%140 = OpLoad %v3float %position_1
|
||||
%141 = OpLoad %v4float %color_1
|
||||
%142 = OpLoad %v2float %quad_pos_1
|
||||
%143 = OpCompositeConstruct %VertexInput %140 %141 %142
|
||||
%139 = OpFunctionCall %VertexOutput %vs_main_inner %143
|
||||
%144 = OpCompositeExtract %v4float %139 0
|
||||
OpStore %position_2 %144
|
||||
%145 = OpCompositeExtract %v4float %139 1
|
||||
OpStore %color_2 %145
|
||||
%146 = OpCompositeExtract %v2float %139 2
|
||||
OpStore %quad_pos_2 %146
|
||||
OpStore %vertex_point_size %float_1
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%fs_main_inner = OpFunction %v4float None %147
|
||||
%in_0 = OpFunctionParameter %VertexOutput
|
||||
%150 = OpLabel
|
||||
%color = OpVariable %_ptr_Function_v4float Function %13
|
||||
%151 = OpCompositeExtract %v4float %in_0 1
|
||||
OpStore %color %151
|
||||
%155 = OpAccessChain %_ptr_Function_float %color %uint_3
|
||||
%156 = OpAccessChain %_ptr_Function_float %color %uint_3
|
||||
%157 = OpLoad %float %156
|
||||
%160 = OpCompositeExtract %v2float %in_0 2
|
||||
%159 = OpExtInst %float %67 Length %160
|
||||
%161 = OpFSub %float %float_1 %159
|
||||
%158 = OpExtInst %float %67 NMax %161 %float_0
|
||||
%163 = OpFMul %float %157 %158
|
||||
OpStore %155 %163
|
||||
%164 = OpLoad %v4float %color
|
||||
OpReturnValue %164
|
||||
OpFunctionEnd
|
||||
%fs_main = OpFunction %void None %135
|
||||
%166 = OpLabel
|
||||
%168 = OpLoad %v4float %position_3
|
||||
%169 = OpLoad %v4float %color_3
|
||||
%170 = OpLoad %v2float %quad_pos_3
|
||||
%171 = OpCompositeConstruct %VertexOutput %168 %169 %170
|
||||
%167 = OpFunctionCall %v4float %fs_main_inner %171
|
||||
OpStore %value_1 %167
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%simulate_inner = OpFunction %void None %172
|
||||
%GlobalInvocationID = OpFunctionParameter %v3uint
|
||||
%175 = OpLabel
|
||||
%particle = OpVariable %_ptr_Function_Particle Function %194
|
||||
%coord = OpVariable %_ptr_Function_v2int Function %235
|
||||
%level = OpVariable %_ptr_Function_int Function %242
|
||||
%270 = OpVariable %_ptr_Function_v2int Function %235
|
||||
%297 = OpVariable %_ptr_Function_v2float Function %17
|
||||
%177 = OpAccessChain %_ptr_Uniform_v4float %sim_params %uint_1
|
||||
%178 = OpLoad %v4float %177
|
||||
%179 = OpVectorShuffle %v2float %178 %178 0 1
|
||||
%182 = OpVectorShuffle %v2uint %GlobalInvocationID %GlobalInvocationID 0 1
|
||||
%180 = OpConvertUToF %v2float %182
|
||||
%183 = OpFAdd %v2float %179 %180
|
||||
%184 = OpAccessChain %_ptr_Uniform_v4float %sim_params %uint_1
|
||||
%185 = OpLoad %v4float %184
|
||||
%186 = OpVectorShuffle %v2float %185 %185 2 3
|
||||
%187 = OpFMul %v2float %183 %186
|
||||
OpStore %rand_seed %187
|
||||
%188 = OpCompositeExtract %uint %GlobalInvocationID 0
|
||||
%190 = OpAccessChain %_ptr_StorageBuffer_Particle %data %uint_0 %188
|
||||
%191 = OpLoad %Particle %190
|
||||
OpStore %particle %191
|
||||
%195 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2
|
||||
%196 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2
|
||||
%197 = OpLoad %float %196
|
||||
%199 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0
|
||||
%200 = OpLoad %float %199
|
||||
%202 = OpFMul %float %200 %float_0_5
|
||||
%203 = OpFSub %float %197 %202
|
||||
OpStore %195 %203
|
||||
%204 = OpAccessChain %_ptr_Function_v3float %particle %uint_0
|
||||
%205 = OpAccessChain %_ptr_Function_v3float %particle %uint_0
|
||||
%206 = OpLoad %v3float %205
|
||||
%207 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0
|
||||
%208 = OpLoad %float %207
|
||||
%209 = OpAccessChain %_ptr_Function_v3float %particle %uint_3
|
||||
%210 = OpLoad %v3float %209
|
||||
%211 = OpVectorTimesScalar %v3float %210 %208
|
||||
%212 = OpFAdd %v3float %206 %211
|
||||
OpStore %204 %212
|
||||
%213 = OpAccessChain %_ptr_Function_float %particle %uint_1
|
||||
%214 = OpAccessChain %_ptr_Function_float %particle %uint_1
|
||||
%215 = OpLoad %float %214
|
||||
%216 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0
|
||||
%217 = OpLoad %float %216
|
||||
%218 = OpFSub %float %215 %217
|
||||
OpStore %213 %218
|
||||
%219 = OpAccessChain %_ptr_Function_float %particle %uint_2 %uint_3
|
||||
%221 = OpAccessChain %_ptr_Function_float %particle %uint_1
|
||||
%222 = OpLoad %float %221
|
||||
%220 = OpExtInst %float %67 SmoothStep %float_0 %float_0_5 %222
|
||||
OpStore %219 %220
|
||||
%223 = OpAccessChain %_ptr_Function_float %particle %uint_1
|
||||
%224 = OpLoad %float %223
|
||||
%225 = OpFOrdLessThan %bool %224 %float_0
|
||||
OpSelectionMerge %227 None
|
||||
OpBranchConditional %225 %228 %227
|
||||
%228 = OpLabel
|
||||
OpStore %coord %232
|
||||
%237 = OpLoad %47 %texture
|
||||
%236 = OpImageQueryLevels %int %237
|
||||
%239 = OpISub %int %236 %int_1
|
||||
OpStore %level %239
|
||||
OpBranch %243
|
||||
%243 = OpLabel
|
||||
OpLoopMerge %244 %245 None
|
||||
OpBranch %246
|
||||
%246 = OpLabel
|
||||
%248 = OpLoad %int %level
|
||||
%249 = OpSGreaterThan %bool %248 %int_0
|
||||
%247 = OpLogicalNot %bool %249
|
||||
OpSelectionMerge %250 None
|
||||
OpBranchConditional %247 %251 %250
|
||||
%251 = OpLabel
|
||||
OpBranch %244
|
||||
%250 = OpLabel
|
||||
%253 = OpLoad %47 %texture
|
||||
%254 = OpLoad %v2int %coord
|
||||
%255 = OpLoad %int %level
|
||||
%252 = OpImageFetch %v4float %253 %254 Lod %255
|
||||
%256 = OpFunctionCall %float %rand
|
||||
%257 = OpCompositeConstruct %v4float %256 %256 %256 %256
|
||||
%258 = OpVectorShuffle %v3float %252 %252 0 1 2
|
||||
%259 = OpCompositeExtract %float %258 0
|
||||
%260 = OpCompositeExtract %float %258 1
|
||||
%261 = OpCompositeExtract %float %258 2
|
||||
%262 = OpCompositeConstruct %v4float %float_0 %259 %260 %261
|
||||
%263 = OpFOrdGreaterThanEqual %v4bool %257 %262
|
||||
%265 = OpFOrdLessThan %v4bool %257 %252
|
||||
%266 = OpLogicalAnd %v4bool %263 %265
|
||||
%267 = OpLoad %v2int %coord
|
||||
%271 = OpCompositeConstruct %v2int %int_2 %int_2
|
||||
%269 = OpIMul %v2int %267 %271
|
||||
OpStore %coord %269
|
||||
%272 = OpAccessChain %_ptr_Function_int %coord %uint_0
|
||||
%273 = OpAccessChain %_ptr_Function_int %coord %uint_0
|
||||
%274 = OpLoad %int %273
|
||||
%278 = OpVectorShuffle %v2bool %266 %266 1 3
|
||||
%276 = OpAny %bool %278
|
||||
%275 = OpSelect %int %276 %int_1 %int_0
|
||||
%279 = OpIAdd %int %274 %275
|
||||
OpStore %272 %279
|
||||
%280 = OpAccessChain %_ptr_Function_int %coord %uint_1
|
||||
%281 = OpAccessChain %_ptr_Function_int %coord %uint_1
|
||||
%282 = OpLoad %int %281
|
||||
%285 = OpVectorShuffle %v2bool %266 %266 2 3
|
||||
%284 = OpAny %bool %285
|
||||
%283 = OpSelect %int %284 %int_1 %int_0
|
||||
%286 = OpIAdd %int %282 %283
|
||||
OpStore %280 %286
|
||||
OpBranch %245
|
||||
%245 = OpLabel
|
||||
%287 = OpLoad %int %level
|
||||
%288 = OpISub %int %287 %int_1
|
||||
OpStore %level %288
|
||||
OpBranch %243
|
||||
%244 = OpLabel
|
||||
%290 = OpLoad %v2int %coord
|
||||
%289 = OpConvertSToF %v2float %290
|
||||
%293 = OpLoad %47 %texture
|
||||
%292 = OpImageQuerySizeLod %v2int %293 %int_0
|
||||
%291 = OpConvertSToF %v2float %292
|
||||
%294 = OpFDiv %v2float %289 %291
|
||||
%295 = OpAccessChain %_ptr_Function_v3float %particle %uint_0
|
||||
%298 = OpCompositeConstruct %v2float %float_0_5 %float_0_5
|
||||
%296 = OpFSub %v2float %294 %298
|
||||
%300 = OpVectorTimesScalar %v2float %296 %float_3
|
||||
%303 = OpFMul %v2float %300 %302
|
||||
%304 = OpCompositeExtract %float %303 0
|
||||
%305 = OpCompositeExtract %float %303 1
|
||||
%306 = OpCompositeConstruct %v3float %304 %305 %float_0
|
||||
OpStore %295 %306
|
||||
%307 = OpAccessChain %_ptr_Function_v4float %particle %uint_2
|
||||
%309 = OpLoad %47 %texture
|
||||
%310 = OpLoad %v2int %coord
|
||||
%308 = OpImageFetch %v4float %309 %310 Lod %int_0
|
||||
OpStore %307 %308
|
||||
%311 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_0
|
||||
%312 = OpFunctionCall %float %rand
|
||||
%313 = OpFSub %float %312 %float_0_5
|
||||
%315 = OpFMul %float %313 %float_0_100000001
|
||||
OpStore %311 %315
|
||||
%316 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_1
|
||||
%317 = OpFunctionCall %float %rand
|
||||
%318 = OpFSub %float %317 %float_0_5
|
||||
%319 = OpFMul %float %318 %float_0_100000001
|
||||
OpStore %316 %319
|
||||
%320 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2
|
||||
%321 = OpFunctionCall %float %rand
|
||||
%323 = OpFMul %float %321 %float_0_300000012
|
||||
OpStore %320 %323
|
||||
%324 = OpAccessChain %_ptr_Function_float %particle %uint_1
|
||||
%325 = OpFunctionCall %float %rand
|
||||
%327 = OpFMul %float %325 %float_2
|
||||
%328 = OpFAdd %float %float_0_5 %327
|
||||
OpStore %324 %328
|
||||
OpBranch %227
|
||||
%227 = OpLabel
|
||||
%329 = OpAccessChain %_ptr_StorageBuffer_Particle %data %uint_0 %188
|
||||
%330 = OpLoad %Particle %particle
|
||||
OpStore %329 %330
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%simulate = OpFunction %void None %135
|
||||
%332 = OpLabel
|
||||
%334 = OpLoad %v3uint %GlobalInvocationID_1
|
||||
%333 = OpFunctionCall %void %simulate_inner %334
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%import_level_inner = OpFunction %void None %172
|
||||
%coord_0 = OpFunctionParameter %v3uint
|
||||
%337 = OpLabel
|
||||
%339 = OpCompositeExtract %uint %coord_0 0
|
||||
%340 = OpCompositeExtract %uint %coord_0 1
|
||||
%342 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0
|
||||
%343 = OpLoad %uint %342
|
||||
%344 = OpIMul %uint %340 %343
|
||||
%345 = OpIAdd %uint %339 %344
|
||||
%347 = OpAccessChain %_ptr_StorageBuffer_float %buf_out %uint_0 %345
|
||||
%349 = OpLoad %47 %tex_in
|
||||
%351 = OpVectorShuffle %v2uint %coord_0 %coord_0 0 1
|
||||
%350 = OpBitcast %v2int %351
|
||||
%348 = OpImageFetch %v4float %349 %350 Lod %int_0
|
||||
%352 = OpCompositeExtract %float %348 3
|
||||
OpStore %347 %352
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%import_level = OpFunction %void None %135
|
||||
%354 = OpLabel
|
||||
%356 = OpLoad %v3uint %coord_1
|
||||
%355 = OpFunctionCall %void %import_level_inner %356
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%export_level_inner = OpFunction %void None %172
|
||||
%coord_3 = OpFunctionParameter %v3uint
|
||||
%359 = OpLabel
|
||||
%413 = OpVariable %_ptr_Function_v4float Function %13
|
||||
%361 = OpVectorShuffle %v2uint %coord_3 %coord_3 0 1
|
||||
%364 = OpLoad %59 %tex_out
|
||||
%363 = OpImageQuerySize %v2int %364
|
||||
%362 = OpBitcast %v2uint %363
|
||||
%365 = OpULessThan %v2bool %361 %362
|
||||
%360 = OpAll %bool %365
|
||||
OpSelectionMerge %366 None
|
||||
OpBranchConditional %360 %367 %366
|
||||
%367 = OpLabel
|
||||
%368 = OpCompositeExtract %uint %coord_3 0
|
||||
%369 = OpCompositeExtract %uint %coord_3 1
|
||||
%370 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0
|
||||
%371 = OpLoad %uint %370
|
||||
%372 = OpIMul %uint %369 %371
|
||||
%373 = OpIAdd %uint %368 %372
|
||||
%374 = OpCompositeExtract %uint %coord_3 0
|
||||
%375 = OpIMul %uint %374 %uint_2
|
||||
%376 = OpCompositeExtract %uint %coord_3 1
|
||||
%377 = OpIMul %uint %376 %uint_2
|
||||
%378 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0
|
||||
%379 = OpLoad %uint %378
|
||||
%380 = OpIMul %uint %377 %379
|
||||
%381 = OpIAdd %uint %375 %380
|
||||
%382 = OpIAdd %uint %381 %uint_0
|
||||
%383 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %382
|
||||
%384 = OpLoad %float %383
|
||||
%385 = OpIAdd %uint %381 %uint_1
|
||||
%386 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %385
|
||||
%387 = OpLoad %float %386
|
||||
%388 = OpIAdd %uint %381 %uint_0
|
||||
%389 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0
|
||||
%390 = OpLoad %uint %389
|
||||
%391 = OpIAdd %uint %388 %390
|
||||
%392 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %391
|
||||
%393 = OpLoad %float %392
|
||||
%394 = OpIAdd %uint %381 %uint_1
|
||||
%395 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0
|
||||
%396 = OpLoad %uint %395
|
||||
%397 = OpIAdd %uint %394 %396
|
||||
%398 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %397
|
||||
%399 = OpLoad %float %398
|
||||
%401 = OpCompositeConstruct %v4float %384 %387 %393 %399
|
||||
%400 = OpDot %float %401 %402
|
||||
%403 = OpAccessChain %_ptr_StorageBuffer_float %buf_out %uint_0 %373
|
||||
%405 = OpFDiv %float %400 %float_4
|
||||
OpStore %403 %405
|
||||
%406 = OpFAdd %float %384 %387
|
||||
%407 = OpFAdd %float %384 %387
|
||||
%408 = OpFAdd %float %407 %393
|
||||
%409 = OpCompositeConstruct %v4float %384 %406 %408 %400
|
||||
%410 = OpExtInst %float %67 NMax %400 %float_9_99999975en05
|
||||
%414 = OpCompositeConstruct %v4float %410 %410 %410 %410
|
||||
%412 = OpFDiv %v4float %409 %414
|
||||
%416 = OpLoad %59 %tex_out
|
||||
%418 = OpVectorShuffle %v2uint %coord_3 %coord_3 0 1
|
||||
%417 = OpBitcast %v2int %418
|
||||
OpImageWrite %416 %417 %412
|
||||
OpBranch %366
|
||||
%366 = OpLabel
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%export_level = OpFunction %void None %135
|
||||
%420 = OpLabel
|
||||
%422 = OpLoad %v3uint %coord_2
|
||||
%421 = OpFunctionCall %void %export_level_inner %422
|
||||
OpReturn
|
||||
OpFunctionEnd
|
|
@ -0,0 +1,144 @@
|
|||
var<private> rand_seed : vec2<f32>;
|
||||
|
||||
fn rand() -> f32 {
|
||||
rand_seed.x = fract((cos(dot(rand_seed, vec2<f32>(23.140779495, 232.616897583))) * 136.816802979));
|
||||
rand_seed.y = fract((cos(dot(rand_seed, vec2<f32>(54.478565216, 345.841522217))) * 534.764526367));
|
||||
return rand_seed.y;
|
||||
}
|
||||
|
||||
struct RenderParams {
|
||||
modelViewProjectionMatrix : mat4x4<f32>;
|
||||
right : vec3<f32>;
|
||||
up : vec3<f32>;
|
||||
};
|
||||
|
||||
[[binding(0), group(0)]] var<uniform> render_params : RenderParams;
|
||||
|
||||
struct VertexInput {
|
||||
[[location(0)]]
|
||||
position : vec3<f32>;
|
||||
[[location(1)]]
|
||||
color : vec4<f32>;
|
||||
[[location(2)]]
|
||||
quad_pos : vec2<f32>;
|
||||
};
|
||||
|
||||
struct VertexOutput {
|
||||
[[builtin(position)]]
|
||||
position : vec4<f32>;
|
||||
[[location(0)]]
|
||||
color : vec4<f32>;
|
||||
[[location(1)]]
|
||||
quad_pos : vec2<f32>;
|
||||
};
|
||||
|
||||
[[stage(vertex)]]
|
||||
fn vs_main(in : VertexInput) -> VertexOutput {
|
||||
var quad_pos = (mat2x3<f32>(render_params.right, render_params.up) * in.quad_pos);
|
||||
var position = (in.position + (quad_pos * 0.01));
|
||||
var out : VertexOutput;
|
||||
out.position = (render_params.modelViewProjectionMatrix * vec4<f32>(position, 1.0));
|
||||
out.color = in.color;
|
||||
out.quad_pos = in.quad_pos;
|
||||
return out;
|
||||
}
|
||||
|
||||
[[stage(fragment)]]
|
||||
fn fs_main(in : VertexOutput) -> [[location(0)]] vec4<f32> {
|
||||
var color = in.color;
|
||||
color.a = (color.a * max((1.0 - length(in.quad_pos)), 0.0));
|
||||
return color;
|
||||
}
|
||||
|
||||
struct SimulationParams {
|
||||
deltaTime : f32;
|
||||
seed : vec4<f32>;
|
||||
};
|
||||
|
||||
struct Particle {
|
||||
position : vec3<f32>;
|
||||
lifetime : f32;
|
||||
color : vec4<f32>;
|
||||
velocity : vec3<f32>;
|
||||
};
|
||||
|
||||
struct Particles {
|
||||
particles : array<Particle>;
|
||||
};
|
||||
|
||||
[[binding(0), group(0)]] var<uniform> sim_params : SimulationParams;
|
||||
|
||||
[[binding(1), group(0)]] var<storage, read_write> data : Particles;
|
||||
|
||||
[[binding(2), group(0)]] var texture : texture_2d<f32>;
|
||||
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn simulate([[builtin(global_invocation_id)]] GlobalInvocationID : vec3<u32>) {
|
||||
rand_seed = ((sim_params.seed.xy + vec2<f32>(GlobalInvocationID.xy)) * sim_params.seed.zw);
|
||||
let idx = GlobalInvocationID.x;
|
||||
var particle = data.particles[idx];
|
||||
particle.velocity.z = (particle.velocity.z - (sim_params.deltaTime * 0.5));
|
||||
particle.position = (particle.position + (sim_params.deltaTime * particle.velocity));
|
||||
particle.lifetime = (particle.lifetime - sim_params.deltaTime);
|
||||
particle.color.a = smoothStep(0.0, 0.5, particle.lifetime);
|
||||
if ((particle.lifetime < 0.0)) {
|
||||
var coord = vec2<i32>(0, 0);
|
||||
for(var level = (textureNumLevels(texture) - 1); (level > 0); level = (level - 1)) {
|
||||
let probabilites = textureLoad(texture, coord, level);
|
||||
let value = vec4<f32>(rand());
|
||||
let mask = ((value >= vec4<f32>(0.0, probabilites.xyz)) & (value < probabilites));
|
||||
coord = (coord * 2);
|
||||
coord.x = (coord.x + select(0, 1, any(mask.yw)));
|
||||
coord.y = (coord.y + select(0, 1, any(mask.zw)));
|
||||
}
|
||||
let uv = (vec2<f32>(coord) / vec2<f32>(textureDimensions(texture)));
|
||||
particle.position = vec3<f32>((((uv - 0.5) * 3.0) * vec2<f32>(1.0, -1.0)), 0.0);
|
||||
particle.color = textureLoad(texture, coord, 0);
|
||||
particle.velocity.x = ((rand() - 0.5) * 0.100000001);
|
||||
particle.velocity.y = ((rand() - 0.5) * 0.100000001);
|
||||
particle.velocity.z = (rand() * 0.300000012);
|
||||
particle.lifetime = (0.5 + (rand() * 2.0));
|
||||
}
|
||||
data.particles[idx] = particle;
|
||||
}
|
||||
|
||||
struct UBO {
|
||||
width : u32;
|
||||
};
|
||||
|
||||
struct Buffer {
|
||||
weights : array<f32>;
|
||||
};
|
||||
|
||||
[[binding(3), group(0)]] var<uniform> ubo : UBO;
|
||||
|
||||
[[binding(4), group(0)]] var<storage, read> buf_in : Buffer;
|
||||
|
||||
[[binding(5), group(0)]] var<storage, read_write> buf_out : Buffer;
|
||||
|
||||
[[binding(6), group(0)]] var tex_in : texture_2d<f32>;
|
||||
|
||||
[[binding(7), group(0)]] var tex_out : texture_storage_2d<rgba8unorm, write>;
|
||||
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn import_level([[builtin(global_invocation_id)]] coord : vec3<u32>) {
|
||||
_ = &(buf_in);
|
||||
let offset = (coord.x + (coord.y * ubo.width));
|
||||
buf_out.weights[offset] = textureLoad(tex_in, vec2<i32>(coord.xy), 0).w;
|
||||
}
|
||||
|
||||
[[stage(compute), workgroup_size(64)]]
|
||||
fn export_level([[builtin(global_invocation_id)]] coord : vec3<u32>) {
|
||||
if (all((coord.xy < vec2<u32>(textureDimensions(tex_out))))) {
|
||||
let dst_offset = (coord.x + (coord.y * ubo.width));
|
||||
let src_offset = ((coord.x * 2u) + ((coord.y * 2u) * ubo.width));
|
||||
let a = buf_in.weights[(src_offset + 0u)];
|
||||
let b = buf_in.weights[(src_offset + 1u)];
|
||||
let c = buf_in.weights[((src_offset + 0u) + ubo.width)];
|
||||
let d = buf_in.weights[((src_offset + 1u) + ubo.width)];
|
||||
let sum = dot(vec4<f32>(a, b, c, d), vec4<f32>(1.0));
|
||||
buf_out.weights[dst_offset] = (sum / 4.0);
|
||||
let probabilities = (vec4<f32>(a, (a + b), ((a + b) + c), sum) / max(sum, 0.0001));
|
||||
textureStore(tex_out, vec2<i32>(coord.xy), probabilities);
|
||||
}
|
||||
}
|
|
@ -0,0 +1,10 @@
|
|||
struct SB {
|
||||
data : array<i32>;
|
||||
};
|
||||
|
||||
[[group(0), binding(0)]] var<storage, read_write> buffer : SB;
|
||||
|
||||
[[stage(compute), workgroup_size(1, 2, 3)]]
|
||||
fn main([[builtin(global_invocation_id)]] id : vec3<u32>) {
|
||||
buffer.data[id.x] = buffer.data[id.x] + 1;
|
||||
}
|
|
@ -0,0 +1,15 @@
|
|||
RWByteAddressBuffer buffer : register(u0, space0);
|
||||
|
||||
struct tint_symbol_1 {
|
||||
uint3 id : SV_DispatchThreadID;
|
||||
};
|
||||
|
||||
void main_inner(uint3 id) {
|
||||
buffer.Store((4u * id.x), asuint((asint(buffer.Load((4u * id.x))) + 1)));
|
||||
}
|
||||
|
||||
[numthreads(1, 2, 3)]
|
||||
void main(tint_symbol_1 tint_symbol) {
|
||||
main_inner(tint_symbol.id);
|
||||
return;
|
||||
}
|
|
@ -0,0 +1,16 @@
|
|||
#include <metal_stdlib>
|
||||
|
||||
using namespace metal;
|
||||
struct SB {
|
||||
/* 0x0000 */ int data[1];
|
||||
};
|
||||
|
||||
void tint_symbol_1_inner(uint3 id, device SB* const tint_symbol_2) {
|
||||
(*(tint_symbol_2)).data[id[0]] = as_type<int>((as_type<uint>((*(tint_symbol_2)).data[id[0]]) + as_type<uint>(1)));
|
||||
}
|
||||
|
||||
kernel void tint_symbol_1(device SB* tint_symbol_3 [[buffer(0)]], uint3 id [[thread_position_in_grid]]) {
|
||||
tint_symbol_1_inner(id, tint_symbol_3);
|
||||
return;
|
||||
}
|
||||
|
|
@ -0,0 +1,55 @@
|
|||
; SPIR-V
|
||||
; Version: 1.3
|
||||
; Generator: Google Tint Compiler; 0
|
||||
; Bound: 29
|
||||
; Schema: 0
|
||||
OpCapability Shader
|
||||
OpMemoryModel Logical GLSL450
|
||||
OpEntryPoint GLCompute %main "main" %id_1
|
||||
OpExecutionMode %main LocalSize 1 2 3
|
||||
OpName %id_1 "id_1"
|
||||
OpName %SB "SB"
|
||||
OpMemberName %SB 0 "data"
|
||||
OpName %buffer "buffer"
|
||||
OpName %main_inner "main_inner"
|
||||
OpName %id "id"
|
||||
OpName %main "main"
|
||||
OpDecorate %id_1 BuiltIn GlobalInvocationId
|
||||
OpDecorate %SB Block
|
||||
OpMemberDecorate %SB 0 Offset 0
|
||||
OpDecorate %_runtimearr_int ArrayStride 4
|
||||
OpDecorate %buffer DescriptorSet 0
|
||||
OpDecorate %buffer Binding 0
|
||||
%uint = OpTypeInt 32 0
|
||||
%v3uint = OpTypeVector %uint 3
|
||||
%_ptr_Input_v3uint = OpTypePointer Input %v3uint
|
||||
%id_1 = OpVariable %_ptr_Input_v3uint Input
|
||||
%int = OpTypeInt 32 1
|
||||
%_runtimearr_int = OpTypeRuntimeArray %int
|
||||
%SB = OpTypeStruct %_runtimearr_int
|
||||
%_ptr_StorageBuffer_SB = OpTypePointer StorageBuffer %SB
|
||||
%buffer = OpVariable %_ptr_StorageBuffer_SB StorageBuffer
|
||||
%void = OpTypeVoid
|
||||
%10 = OpTypeFunction %void %v3uint
|
||||
%uint_0 = OpConstant %uint 0
|
||||
%_ptr_StorageBuffer_int = OpTypePointer StorageBuffer %int
|
||||
%int_1 = OpConstant %int 1
|
||||
%24 = OpTypeFunction %void
|
||||
%main_inner = OpFunction %void None %10
|
||||
%id = OpFunctionParameter %v3uint
|
||||
%14 = OpLabel
|
||||
%16 = OpCompositeExtract %uint %id 0
|
||||
%18 = OpAccessChain %_ptr_StorageBuffer_int %buffer %uint_0 %16
|
||||
%19 = OpCompositeExtract %uint %id 0
|
||||
%20 = OpAccessChain %_ptr_StorageBuffer_int %buffer %uint_0 %19
|
||||
%21 = OpLoad %int %20
|
||||
%23 = OpIAdd %int %21 %int_1
|
||||
OpStore %18 %23
|
||||
OpReturn
|
||||
OpFunctionEnd
|
||||
%main = OpFunction %void None %24
|
||||
%26 = OpLabel
|
||||
%28 = OpLoad %v3uint %id_1
|
||||
%27 = OpFunctionCall %void %main_inner %28
|
||||
OpReturn
|
||||
OpFunctionEnd
|
|
@ -0,0 +1,10 @@
|
|||
struct SB {
|
||||
data : array<i32>;
|
||||
};
|
||||
|
||||
[[group(0), binding(0)]] var<storage, read_write> buffer : SB;
|
||||
|
||||
[[stage(compute), workgroup_size(1, 2, 3)]]
|
||||
fn main([[builtin(global_invocation_id)]] id : vec3<u32>) {
|
||||
buffer.data[id.x] = (buffer.data[id.x] + 1);
|
||||
}
|
|
@ -0,0 +1,12 @@
|
|||
struct Input {
|
||||
[[location(0)]] color: vec4<f32>;
|
||||
};
|
||||
|
||||
struct Output {
|
||||
[[location(0)]] color: vec4<f32>;
|
||||
};
|
||||
|
||||
[[stage(fragment)]]
|
||||
fn main(in : Input) -> Output {
|
||||
return Output(in.color);
|
||||
}
|
|
@ -0,0 +1,25 @@
|
|||
struct Input {
|
||||
float4 color;
|
||||
};
|
||||
struct Output {
|
||||
float4 color;
|
||||
};
|
||||
struct tint_symbol_2 {
|
||||
float4 color : TEXCOORD0;
|
||||
};
|
||||
struct tint_symbol_3 {
|
||||
float4 color : SV_Target0;
|
||||
};
|
||||
|
||||
Output main_inner(Input tint_symbol) {
|
||||
const Output tint_symbol_4 = {tint_symbol.color};
|
||||
return tint_symbol_4;
|
||||
}
|
||||
|
||||
tint_symbol_3 main(tint_symbol_2 tint_symbol_1) {
|
||||
const Input tint_symbol_5 = {tint_symbol_1.color};
|
||||
const Output inner_result = main_inner(tint_symbol_5);
|
||||
tint_symbol_3 wrapper_result = (tint_symbol_3)0;
|
||||
wrapper_result.color = inner_result.color;
|
||||
return wrapper_result;
|
||||
}
|
|
@ -0,0 +1,29 @@
|
|||
#include <metal_stdlib>
|
||||
|
||||
using namespace metal;
|
||||
struct Input {
|
||||
float4 color;
|
||||
};
|
||||
struct Output {
|
||||
float4 color;
|
||||
};
|
||||
struct tint_symbol_2 {
|
||||
float4 color [[user(locn0)]];
|
||||
};
|
||||
struct tint_symbol_3 {
|
||||
float4 color [[color(0)]];
|
||||
};
|
||||
|
||||
Output tint_symbol_inner(Input in) {
|
||||
Output const tint_symbol_4 = {.color=in.color};
|
||||
return tint_symbol_4;
|
||||
}
|
||||
|
||||
fragment tint_symbol_3 tint_symbol(tint_symbol_2 tint_symbol_1 [[stage_in]]) {
|
||||
Input const tint_symbol_5 = {.color=tint_symbol_1.color};
|
||||
Output const inner_result = tint_symbol_inner(tint_symbol_5);
|
||||
tint_symbol_3 wrapper_result = {};
|
||||
wrapper_result.color = inner_result.color;
|
||||
return wrapper_result;
|
||||
}
|
||||
|
|
@ -0,0 +1,50 @@
|
|||
; SPIR-V
|
||||
; Version: 1.3
|
||||
; Generator: Google Tint Compiler; 0
|
||||
; Bound: 24
|
||||
; Schema: 0
|
||||
OpCapability Shader
|
||||
OpMemoryModel Logical GLSL450
|
||||
OpEntryPoint Fragment %main "main" %color_1 %color_2
|
||||
OpExecutionMode %main OriginUpperLeft
|
||||
OpName %color_1 "color_1"
|
||||
OpName %color_2 "color_2"
|
||||
OpName %Output "Output"
|
||||
OpMemberName %Output 0 "color"
|
||||
OpName %Input "Input"
|
||||
OpMemberName %Input 0 "color"
|
||||
OpName %main_inner "main_inner"
|
||||
OpName %in "in"
|
||||
OpName %main "main"
|
||||
OpDecorate %color_1 Location 0
|
||||
OpDecorate %color_2 Location 0
|
||||
OpMemberDecorate %Output 0 Offset 0
|
||||
OpMemberDecorate %Input 0 Offset 0
|
||||
%float = OpTypeFloat 32
|
||||
%v4float = OpTypeVector %float 4
|
||||
%_ptr_Input_v4float = OpTypePointer Input %v4float
|
||||
%color_1 = OpVariable %_ptr_Input_v4float Input
|
||||
%_ptr_Output_v4float = OpTypePointer Output %v4float
|
||||
%7 = OpConstantNull %v4float
|
||||
%color_2 = OpVariable %_ptr_Output_v4float Output %7
|
||||
%Output = OpTypeStruct %v4float
|
||||
%Input = OpTypeStruct %v4float
|
||||
%8 = OpTypeFunction %Output %Input
|
||||
%void = OpTypeVoid
|
||||
%16 = OpTypeFunction %void
|
||||
%main_inner = OpFunction %Output None %8
|
||||
%in = OpFunctionParameter %Input
|
||||
%13 = OpLabel
|
||||
%14 = OpCompositeExtract %v4float %in 0
|
||||
%15 = OpCompositeConstruct %Output %14
|
||||
OpReturnValue %15
|
||||
OpFunctionEnd
|
||||
%main = OpFunction %void None %16
|
||||
%19 = OpLabel
|
||||
%21 = OpLoad %v4float %color_1
|
||||
%22 = OpCompositeConstruct %Input %21
|
||||
%20 = OpFunctionCall %Output %main_inner %22
|
||||
%23 = OpCompositeExtract %v4float %20 0
|
||||
OpStore %color_2 %23
|
||||
OpReturn
|
||||
OpFunctionEnd
|
|
@ -0,0 +1,14 @@
|
|||
struct Input {
|
||||
[[location(0)]]
|
||||
color : vec4<f32>;
|
||||
};
|
||||
|
||||
struct Output {
|
||||
[[location(0)]]
|
||||
color : vec4<f32>;
|
||||
};
|
||||
|
||||
[[stage(fragment)]]
|
||||
fn main(in : Input) -> Output {
|
||||
return Output(in.color);
|
||||
}
|
|
@ -0,0 +1,12 @@
|
|||
struct Input {
|
||||
[[location(0)]] position: vec4<f32>;
|
||||
};
|
||||
|
||||
struct Output {
|
||||
[[builtin(position)]] position : vec4<f32>;
|
||||
};
|
||||
|
||||
[[stage(vertex)]]
|
||||
fn main(in : Input) -> Output {
|
||||
return Output(in.position);
|
||||
}
|
|
@ -0,0 +1,25 @@
|
|||
struct Input {
|
||||
float4 position;
|
||||
};
|
||||
struct Output {
|
||||
float4 position;
|
||||
};
|
||||
struct tint_symbol_2 {
|
||||
float4 position : TEXCOORD0;
|
||||
};
|
||||
struct tint_symbol_3 {
|
||||
float4 position : SV_Position;
|
||||
};
|
||||
|
||||
Output main_inner(Input tint_symbol) {
|
||||
const Output tint_symbol_4 = {tint_symbol.position};
|
||||
return tint_symbol_4;
|
||||
}
|
||||
|
||||
tint_symbol_3 main(tint_symbol_2 tint_symbol_1) {
|
||||
const Input tint_symbol_5 = {tint_symbol_1.position};
|
||||
const Output inner_result = main_inner(tint_symbol_5);
|
||||
tint_symbol_3 wrapper_result = (tint_symbol_3)0;
|
||||
wrapper_result.position = inner_result.position;
|
||||
return wrapper_result;
|
||||
}
|
|
@ -0,0 +1,29 @@
|
|||
#include <metal_stdlib>
|
||||
|
||||
using namespace metal;
|
||||
struct Input {
|
||||
float4 position;
|
||||
};
|
||||
struct Output {
|
||||
float4 position;
|
||||
};
|
||||
struct tint_symbol_2 {
|
||||
float4 position [[attribute(0)]];
|
||||
};
|
||||
struct tint_symbol_3 {
|
||||
float4 position [[position]];
|
||||
};
|
||||
|
||||
Output tint_symbol_inner(Input in) {
|
||||
Output const tint_symbol_4 = {.position=in.position};
|
||||
return tint_symbol_4;
|
||||
}
|
||||
|
||||
vertex tint_symbol_3 tint_symbol(tint_symbol_2 tint_symbol_1 [[stage_in]]) {
|
||||
Input const tint_symbol_5 = {.position=tint_symbol_1.position};
|
||||
Output const inner_result = tint_symbol_inner(tint_symbol_5);
|
||||
tint_symbol_3 wrapper_result = {};
|
||||
wrapper_result.position = inner_result.position;
|
||||
return wrapper_result;
|
||||
}
|
||||
|
|
@ -0,0 +1,56 @@
|
|||
; SPIR-V
|
||||
; Version: 1.3
|
||||
; Generator: Google Tint Compiler; 0
|
||||
; Bound: 28
|
||||
; Schema: 0
|
||||
OpCapability Shader
|
||||
OpMemoryModel Logical GLSL450
|
||||
OpEntryPoint Vertex %main "main" %position_1 %position_2 %vertex_point_size
|
||||
OpName %position_1 "position_1"
|
||||
OpName %position_2 "position_2"
|
||||
OpName %vertex_point_size "vertex_point_size"
|
||||
OpName %Output "Output"
|
||||
OpMemberName %Output 0 "position"
|
||||
OpName %Input "Input"
|
||||
OpMemberName %Input 0 "position"
|
||||
OpName %main_inner "main_inner"
|
||||
OpName %in "in"
|
||||
OpName %main "main"
|
||||
OpDecorate %position_1 Location 0
|
||||
OpDecorate %position_2 BuiltIn Position
|
||||
OpDecorate %vertex_point_size BuiltIn PointSize
|
||||
OpMemberDecorate %Output 0 Offset 0
|
||||
OpMemberDecorate %Input 0 Offset 0
|
||||
%float = OpTypeFloat 32
|
||||
%v4float = OpTypeVector %float 4
|
||||
%_ptr_Input_v4float = OpTypePointer Input %v4float
|
||||
%position_1 = OpVariable %_ptr_Input_v4float Input
|
||||
%_ptr_Output_v4float = OpTypePointer Output %v4float
|
||||
%7 = OpConstantNull %v4float
|
||||
%position_2 = OpVariable %_ptr_Output_v4float Output %7
|
||||
%_ptr_Output_float = OpTypePointer Output %float
|
||||
%10 = OpConstantNull %float
|
||||
%vertex_point_size = OpVariable %_ptr_Output_float Output %10
|
||||
%Output = OpTypeStruct %v4float
|
||||
%Input = OpTypeStruct %v4float
|
||||
%11 = OpTypeFunction %Output %Input
|
||||
%void = OpTypeVoid
|
||||
%19 = OpTypeFunction %void
|
||||
%float_1 = OpConstant %float 1
|
||||
%main_inner = OpFunction %Output None %11
|
||||
%in = OpFunctionParameter %Input
|
||||
%16 = OpLabel
|
||||
%17 = OpCompositeExtract %v4float %in 0
|
||||
%18 = OpCompositeConstruct %Output %17
|
||||
OpReturnValue %18
|
||||
OpFunctionEnd
|
||||
%main = OpFunction %void None %19
|
||||
%22 = OpLabel
|
||||
%24 = OpLoad %v4float %position_1
|
||||
%25 = OpCompositeConstruct %Input %24
|
||||
%23 = OpFunctionCall %Output %main_inner %25
|
||||
%26 = OpCompositeExtract %v4float %23 0
|
||||
OpStore %position_2 %26
|
||||
OpStore %vertex_point_size %float_1
|
||||
OpReturn
|
||||
OpFunctionEnd
|
|
@ -0,0 +1,14 @@
|
|||
struct Input {
|
||||
[[location(0)]]
|
||||
position : vec4<f32>;
|
||||
};
|
||||
|
||||
struct Output {
|
||||
[[builtin(position)]]
|
||||
position : vec4<f32>;
|
||||
};
|
||||
|
||||
[[stage(vertex)]]
|
||||
fn main(in : Input) -> Output {
|
||||
return Output(in.position);
|
||||
}
|
|
@ -12,6 +12,11 @@
|
|||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
if (${TINT_BUILD_BENCHMARKS})
|
||||
set(BENCHMARK_ENABLE_TESTING FALSE CACHE BOOL FALSE FORCE)
|
||||
add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/benchmark EXCLUDE_FROM_ALL)
|
||||
endif()
|
||||
|
||||
if (${TINT_BUILD_TESTS} AND NOT TARGET gmock)
|
||||
set(gtest_force_shared_crt ON CACHE BOOL "Controls whether a shared run-time library should be used even when Google Test is built as static library" FORCE)
|
||||
add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/googletest EXCLUDE_FROM_ALL)
|
||||
|
|
|
@ -0,0 +1,33 @@
|
|||
#!/usr/bin/env bash
|
||||
# Copyright 2022 The Tint Authors
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License");
|
||||
# you may not use this file except in compliance with the License.
|
||||
# You may obtain a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS,
|
||||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
# See the License for the specific language governing permissions and
|
||||
# limitations under the License.
|
||||
|
||||
set -e # Fail on any error.
|
||||
|
||||
if [ ! -x "$(which go)" ] ; then
|
||||
echo "error: go needs to be on \$PATH to use $0"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1 && pwd )"
|
||||
ROOT_DIR="$( cd "${SCRIPT_DIR}/.." >/dev/null 2>&1 && pwd )"
|
||||
BINARY="${SCRIPT_DIR}/bin/benchdiff"
|
||||
|
||||
# Rebuild the binary.
|
||||
# Note, go caches build artifacts, so this is quick for repeat calls
|
||||
pushd "${SCRIPT_DIR}/src/cmd/benchdiff" > /dev/null
|
||||
go build -o "${BINARY}" main.go
|
||||
popd > /dev/null
|
||||
|
||||
"${BINARY}" "$@"
|
|
@ -0,0 +1,150 @@
|
|||
// Copyright 2022 The Tint Authors
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// https://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
// Package bench provides types and methods for parsing Google benchmark results.
|
||||
package bench
|
||||
|
||||
import (
|
||||
"encoding/json"
|
||||
"errors"
|
||||
"fmt"
|
||||
"regexp"
|
||||
"strconv"
|
||||
"strings"
|
||||
"time"
|
||||
)
|
||||
|
||||
// Test holds the results of a single benchmark test.
|
||||
type Test struct {
|
||||
Name string
|
||||
NumTasks uint
|
||||
NumThreads uint
|
||||
Duration time.Duration
|
||||
Iterations uint
|
||||
}
|
||||
|
||||
var testVarRE = regexp.MustCompile(`([\w])+:([0-9]+)`)
|
||||
|
||||
func (t *Test) parseName() {
|
||||
for _, match := range testVarRE.FindAllStringSubmatch(t.Name, -1) {
|
||||
if len(match) != 3 {
|
||||
continue
|
||||
}
|
||||
n, err := strconv.Atoi(match[2])
|
||||
if err != nil {
|
||||
continue
|
||||
}
|
||||
switch match[1] {
|
||||
case "threads":
|
||||
t.NumThreads = uint(n)
|
||||
case "tasks":
|
||||
t.NumTasks = uint(n)
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Benchmark holds a set of benchmark test results.
|
||||
type Benchmark struct {
|
||||
Tests []Test
|
||||
}
|
||||
|
||||
// Parse parses the benchmark results from the string s.
|
||||
// Parse will handle the json and 'console' formats.
|
||||
func Parse(s string) (Benchmark, error) {
|
||||
type Parser = func(s string) (Benchmark, error)
|
||||
for _, parser := range []Parser{parseConsole, parseJSON} {
|
||||
b, err := parser(s)
|
||||
switch err {
|
||||
case nil:
|
||||
return b, nil
|
||||
case errWrongFormat:
|
||||
default:
|
||||
return Benchmark{}, err
|
||||
}
|
||||
}
|
||||
|
||||
return Benchmark{}, errors.New("Unrecognised file format")
|
||||
}
|
||||
|
||||
var errWrongFormat = errors.New("Wrong format")
|
||||
var consoleLineRE = regexp.MustCompile(`([\w/:]+)\s+([0-9]+(?:.[0-9]+)?) ns\s+[0-9]+(?:.[0-9]+) ns\s+([0-9]+)`)
|
||||
|
||||
func parseConsole(s string) (Benchmark, error) {
|
||||
blocks := strings.Split(s, "------------------------------------------------------------------------------------------")
|
||||
if len(blocks) != 3 {
|
||||
return Benchmark{}, errWrongFormat
|
||||
}
|
||||
|
||||
lines := strings.Split(blocks[2], "\n")
|
||||
b := Benchmark{
|
||||
Tests: make([]Test, 0, len(lines)),
|
||||
}
|
||||
for _, line := range lines {
|
||||
if len(line) == 0 {
|
||||
continue
|
||||
}
|
||||
matches := consoleLineRE.FindStringSubmatch(line)
|
||||
if len(matches) != 4 {
|
||||
return Benchmark{}, fmt.Errorf("Unable to parse the line:\n" + line)
|
||||
}
|
||||
ns, err := strconv.ParseFloat(matches[2], 64)
|
||||
if err != nil {
|
||||
return Benchmark{}, fmt.Errorf("Unable to parse the duration: " + matches[2])
|
||||
}
|
||||
iterations, err := strconv.Atoi(matches[3])
|
||||
if err != nil {
|
||||
return Benchmark{}, fmt.Errorf("Unable to parse the number of iterations: " + matches[3])
|
||||
}
|
||||
|
||||
t := Test{
|
||||
Name: matches[1],
|
||||
Duration: time.Nanosecond * time.Duration(ns),
|
||||
Iterations: uint(iterations),
|
||||
}
|
||||
t.parseName()
|
||||
b.Tests = append(b.Tests, t)
|
||||
}
|
||||
return b, nil
|
||||
}
|
||||
|
||||
func parseJSON(s string) (Benchmark, error) {
|
||||
type T struct {
|
||||
Name string `json:"name"`
|
||||
Iterations uint `json:"iterations"`
|
||||
Time float64 `json:"real_time"`
|
||||
}
|
||||
type B struct {
|
||||
Tests []T `json:"benchmarks"`
|
||||
}
|
||||
b := B{}
|
||||
d := json.NewDecoder(strings.NewReader(s))
|
||||
if err := d.Decode(&b); err != nil {
|
||||
return Benchmark{}, err
|
||||
}
|
||||
|
||||
out := Benchmark{
|
||||
Tests: make([]Test, len(b.Tests)),
|
||||
}
|
||||
for i, test := range b.Tests {
|
||||
t := Test{
|
||||
Name: test.Name,
|
||||
Duration: time.Nanosecond * time.Duration(int64(test.Time)),
|
||||
Iterations: test.Iterations,
|
||||
}
|
||||
t.parseName()
|
||||
out.Tests[i] = t
|
||||
}
|
||||
|
||||
return out, nil
|
||||
}
|
|
@ -0,0 +1,177 @@
|
|||
// Copyright 2022 The Tint Authors.
|
||||
//
|
||||
// Licensed under the Apache License, Version 2.0 (the "License");
|
||||
// you may not use this file except in compliance with the License.
|
||||
// You may obtain a copy of the License at
|
||||
//
|
||||
// https://www.apache.org/licenses/LICENSE-2.0
|
||||
//
|
||||
// Unless required by applicable law or agreed to in writing, software
|
||||
// distributed under the License is distributed on an "AS IS" BASIS,
|
||||
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
// See the License for the specific language governing permissions and
|
||||
// limitations under the License.
|
||||
|
||||
// benchdiff is a tool that compares two Google benchmark results and displays
|
||||
// sorted performance differences.
|
||||
package main
|
||||
|
||||
import (
|
||||
"errors"
|
||||
"flag"
|
||||
"fmt"
|
||||
"io/ioutil"
|
||||
"os"
|
||||
"path/filepath"
|
||||
"sort"
|
||||
"strings"
|
||||
"text/tabwriter"
|
||||
"time"
|
||||
|
||||
"dawn.googlesource.com/tint/tools/src/bench"
|
||||
)
|
||||
|
||||
var (
|
||||
minDiff = flag.Duration("min-diff", time.Microsecond*10, "Filter away time diffs less than this duration")
|
||||
minRelDiff = flag.Float64("min-rel-diff", 0.01, "Filter away absolute relative diffs between [1, 1+x]")
|
||||
)
|
||||
|
||||
func main() {
|
||||
flag.ErrHelp = errors.New("benchdiff is a tool to compare two benchmark results")
|
||||
flag.Parse()
|
||||
flag.Usage = func() {
|
||||
fmt.Fprintln(os.Stderr, "benchdiff <benchmark-a> <benchmark-b>")
|
||||
flag.PrintDefaults()
|
||||
}
|
||||
|
||||
args := flag.Args()
|
||||
if len(args) < 2 {
|
||||
flag.Usage()
|
||||
os.Exit(1)
|
||||
}
|
||||
|
||||
pathA, pathB := args[0], args[1]
|
||||
|
||||
if err := run(pathA, pathB); err != nil {
|
||||
fmt.Fprintln(os.Stderr, err)
|
||||
os.Exit(-1)
|
||||
}
|
||||
}
|
||||
|
||||
func run(pathA, pathB string) error {
|
||||
fileA, err := ioutil.ReadFile(pathA)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
benchA, err := bench.Parse(string(fileA))
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
|
||||
fileB, err := ioutil.ReadFile(pathB)
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
benchB, err := bench.Parse(string(fileB))
|
||||
if err != nil {
|
||||
return err
|
||||
}
|
||||
|
||||
compare(benchA, benchB, fileName(pathA), fileName(pathB))
|
||||
|
||||
return nil
|
||||
}
|
||||
|
||||
func fileName(path string) string {
|
||||
_, name := filepath.Split(path)
|
||||
return name
|
||||
}
|
||||
|
||||
func compare(benchA, benchB bench.Benchmark, nameA, nameB string) {
|
||||
type times struct {
|
||||
a time.Duration
|
||||
b time.Duration
|
||||
}
|
||||
byName := map[string]times{}
|
||||
for _, test := range benchA.Tests {
|
||||
byName[test.Name] = times{a: test.Duration}
|
||||
}
|
||||
for _, test := range benchB.Tests {
|
||||
t := byName[test.Name]
|
||||
t.b = test.Duration
|
||||
byName[test.Name] = t
|
||||
}
|
||||
|
||||
type delta struct {
|
||||
name string
|
||||
times times
|
||||
relDiff float64
|
||||
absRelDiff float64
|
||||
}
|
||||
deltas := []delta{}
|
||||
for name, times := range byName {
|
||||
if times.a == 0 || times.b == 0 {
|
||||
continue // Assuming test was missing from a or b
|
||||
}
|
||||
diff := times.b - times.a
|
||||
absDiff := diff
|
||||
if absDiff < 0 {
|
||||
absDiff = -absDiff
|
||||
}
|
||||
if absDiff < *minDiff {
|
||||
continue
|
||||
}
|
||||
|
||||
relDiff := float64(times.b) / float64(times.a)
|
||||
absRelDiff := relDiff
|
||||
if absRelDiff < 1 {
|
||||
absRelDiff = 1.0 / absRelDiff
|
||||
}
|
||||
if absRelDiff < (1.0 + *minRelDiff) {
|
||||
continue
|
||||
}
|
||||
|
||||
d := delta{
|
||||
name: name,
|
||||
times: times,
|
||||
relDiff: relDiff,
|
||||
absRelDiff: absRelDiff,
|
||||
}
|
||||
deltas = append(deltas, d)
|
||||
}
|
||||
|
||||
sort.Slice(deltas, func(i, j int) bool { return deltas[j].relDiff < deltas[i].relDiff })
|
||||
|
||||
fmt.Println("A:", nameA)
|
||||
fmt.Println("B:", nameB)
|
||||
fmt.Println()
|
||||
|
||||
buf := strings.Builder{}
|
||||
{
|
||||
w := tabwriter.NewWriter(&buf, 1, 1, 0, ' ', 0)
|
||||
fmt.Fprintln(w, "Test name\t | Δ (A → B)\t | % (A → B)\t | % (B → A)\t | × (A → B)\t | × (B → A)\t | A \t | B")
|
||||
fmt.Fprintln(w, "\t-+\t-+\t-+\t-+\t-+\t-+\t-+\t-")
|
||||
for _, delta := range deltas {
|
||||
a2b := delta.times.b - delta.times.a
|
||||
fmt.Fprintf(w, "%v \t | %v \t | %+2.1f%% \t | %+2.1f%% \t | %+.4f \t | %+.4f \t | %v \t | %v \t|\n",
|
||||
delta.name,
|
||||
a2b, // Δ (A → B)
|
||||
100*float64(a2b)/float64(delta.times.a), // % (A → B)
|
||||
100*float64(-a2b)/float64(delta.times.b), // % (B → A)
|
||||
float64(delta.times.b)/float64(delta.times.a), // × (A → B)
|
||||
float64(delta.times.a)/float64(delta.times.b), // × (B → A)
|
||||
delta.times.a, // A
|
||||
delta.times.b, // B
|
||||
)
|
||||
}
|
||||
w.Flush()
|
||||
}
|
||||
|
||||
// Split the table by line so we can add in a header line
|
||||
lines := strings.Split(buf.String(), "\n")
|
||||
fmt.Println(lines[0])
|
||||
fmt.Println(strings.ReplaceAll(lines[1], " ", "-"))
|
||||
for _, l := range lines[2:] {
|
||||
fmt.Println(l)
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue