mirror of
				https://github.com/encounter/dawn-cmake.git
				synced 2025-10-26 11:40:29 +00:00 
			
		
		
		
	benchmarks: Add a basic set of benchmarks
Add google benchmark to the DEPs. Implement a basic set of benchmarks for each of the writers and the WGSL parser. Add build rules for CMake. GN build rules TODO. Add a simple go tool (ported from Marl) to diff two benchmarks. Less noisy than the one provided by google benchmark. Bug: tint:1378 Change-Id: I73cf92c5d9fd2d3bfac8f264864fd774afbd5d01 Reviewed-on: https://dawn-review.googlesource.com/c/tint/+/76840 Kokoro: Kokoro <noreply+kokoro@google.com> Reviewed-by: Ryan Harrison <rharrison@chromium.org> Commit-Queue: Ben Clayton <bclayton@chromium.org>
This commit is contained in:
		
							parent
							
								
									dcb24cea41
								
							
						
					
					
						commit
						be2362b18c
					
				| @ -81,6 +81,7 @@ option_if_not_defined(TINT_BUILD_FUZZERS "Build fuzzers" OFF) | ||||
| option_if_not_defined(TINT_BUILD_SPIRV_TOOLS_FUZZER "Build SPIRV-Tools fuzzer" OFF) | ||||
| option_if_not_defined(TINT_BUILD_AST_FUZZER "Build AST fuzzer" OFF) | ||||
| option_if_not_defined(TINT_BUILD_REGEX_FUZZER "Build regex fuzzer" OFF) | ||||
| option_if_not_defined(TINT_BUILD_BENCHMARKS "Build benchmarks" OFF) | ||||
| option_if_not_defined(TINT_BUILD_TESTS "Build tests" ${TINT_BUILD_TESTS_DEFAULT}) | ||||
| option_if_not_defined(TINT_BUILD_AS_OTHER_OS "Override OS detection to force building of *_other.cc files" OFF) | ||||
| option_if_not_defined(TINT_BUILD_REMOTE_COMPILE "Build the remote-compile tool for validating shaders on a remote machine" OFF) | ||||
| @ -111,6 +112,7 @@ message(STATUS "Tint build fuzzers: ${TINT_BUILD_FUZZERS}") | ||||
| message(STATUS "Tint build SPIRV-Tools fuzzer: ${TINT_BUILD_SPIRV_TOOLS_FUZZER}") | ||||
| message(STATUS "Tint build AST fuzzer: ${TINT_BUILD_AST_FUZZER}") | ||||
| message(STATUS "Tint build regex fuzzer: ${TINT_BUILD_REGEX_FUZZER}") | ||||
| message(STATUS "Tint build benchmarks: ${TINT_BUILD_BENCHMARKS}") | ||||
| message(STATUS "Tint build tests: ${TINT_BUILD_TESTS}") | ||||
| message(STATUS "Tint build with ASAN: ${TINT_ENABLE_ASAN}") | ||||
| message(STATUS "Tint build with MSAN: ${TINT_ENABLE_MSAN}") | ||||
| @ -254,7 +256,7 @@ if(${TINT_BUILD_DOCS}) | ||||
|   endif(DOXYGEN_FOUND) | ||||
| endif() | ||||
| 
 | ||||
| function(tint_default_compile_options TARGET) | ||||
| function(tint_core_compile_options TARGET) | ||||
|   target_include_directories(${TARGET} PUBLIC "${TINT_ROOT_SOURCE_DIR}") | ||||
|   target_include_directories(${TARGET} PUBLIC "${TINT_ROOT_SOURCE_DIR}/include") | ||||
| 
 | ||||
| @ -263,20 +265,48 @@ function(tint_default_compile_options TARGET) | ||||
|         "${TINT_ROOT_SOURCE_DIR}/third_party/spirv-headers/include") | ||||
|   endif() | ||||
| 
 | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_SPV_READER=$<BOOL:${TINT_BUILD_SPV_READER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_WGSL_READER=$<BOOL:${TINT_BUILD_WGSL_READER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_GLSL_WRITER=$<BOOL:${TINT_BUILD_GLSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_HLSL_WRITER=$<BOOL:${TINT_BUILD_HLSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_MSL_WRITER=$<BOOL:${TINT_BUILD_MSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_SPV_WRITER=$<BOOL:${TINT_BUILD_SPV_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC | ||||
|       -DTINT_BUILD_WGSL_WRITER=$<BOOL:${TINT_BUILD_WGSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_SPV_READER=$<BOOL:${TINT_BUILD_SPV_READER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_WGSL_READER=$<BOOL:${TINT_BUILD_WGSL_READER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_GLSL_WRITER=$<BOOL:${TINT_BUILD_GLSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_HLSL_WRITER=$<BOOL:${TINT_BUILD_HLSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_MSL_WRITER=$<BOOL:${TINT_BUILD_MSL_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_SPV_WRITER=$<BOOL:${TINT_BUILD_SPV_WRITER}>) | ||||
|   target_compile_definitions(${TARGET} PUBLIC -DTINT_BUILD_WGSL_WRITER=$<BOOL:${TINT_BUILD_WGSL_WRITER}>) | ||||
| 
 | ||||
|   if (COMPILER_IS_LIKE_GNU) | ||||
|     target_compile_options(${TARGET} PRIVATE | ||||
|       -std=c++17 | ||||
|       -fno-exceptions | ||||
|       -fno-rtti | ||||
|     ) | ||||
| 
 | ||||
|     if (${TINT_ENABLE_MSAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=memory) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=memory) | ||||
|     elseif (${TINT_ENABLE_ASAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=address) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=address) | ||||
|     elseif (${TINT_ENABLE_UBSAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=undefined) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=undefined) | ||||
|     endif() | ||||
|   endif(COMPILER_IS_LIKE_GNU) | ||||
| 
 | ||||
|   if (TINT_EMIT_COVERAGE) | ||||
|     if(CMAKE_CXX_COMPILER_ID MATCHES "GNU") | ||||
|         target_compile_options(${TARGET} PRIVATE "--coverage") | ||||
|         target_link_options(${TARGET} PRIVATE "gcov") | ||||
|     elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang") | ||||
|         target_compile_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping") | ||||
|         target_link_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping") | ||||
|     else() | ||||
|         message(FATAL_ERROR "Coverage generation not supported for the ${CMAKE_CXX_COMPILER_ID} toolchain") | ||||
|     endif() | ||||
|   endif(TINT_EMIT_COVERAGE) | ||||
| endfunction() | ||||
| 
 | ||||
| function(tint_default_compile_options TARGET) | ||||
|   tint_core_compile_options(${TARGET}) | ||||
| 
 | ||||
|   set(COMMON_GNU_OPTIONS | ||||
|     -Wall | ||||
| @ -299,11 +329,8 @@ function(tint_default_compile_options TARGET) | ||||
|     -Weverything | ||||
|   ) | ||||
| 
 | ||||
|   if (${COMPILER_IS_LIKE_GNU}) | ||||
|   if (COMPILER_IS_LIKE_GNU) | ||||
|     target_compile_options(${TARGET} PRIVATE | ||||
|       -std=c++17 | ||||
|       -fno-exceptions | ||||
|       -fno-rtti | ||||
|       -pedantic-errors | ||||
|       ${COMMON_GNU_OPTIONS} | ||||
|     ) | ||||
| @ -314,30 +341,7 @@ function(tint_default_compile_options TARGET) | ||||
|         ${COMMON_CLANG_OPTIONS} | ||||
|       ) | ||||
|     endif() | ||||
| 
 | ||||
|     if (${TINT_ENABLE_MSAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=memory) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=memory) | ||||
|     elseif (${TINT_ENABLE_ASAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=address) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=address) | ||||
|     elseif (${TINT_ENABLE_UBSAN}) | ||||
|       target_compile_options(${TARGET} PRIVATE -fsanitize=undefined) | ||||
|       target_link_options(${TARGET} PRIVATE -fsanitize=undefined) | ||||
|     endif() | ||||
|   endif() | ||||
| 
 | ||||
|   if (${TINT_EMIT_COVERAGE}) | ||||
|     if(CMAKE_CXX_COMPILER_ID MATCHES "GNU") | ||||
|         target_compile_options(${TARGET} PRIVATE "--coverage") | ||||
|         target_link_options(${TARGET} PRIVATE "gcov") | ||||
|     elseif(CMAKE_CXX_COMPILER_ID MATCHES "Clang") | ||||
|         target_compile_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping") | ||||
|         target_link_options(${TARGET} PRIVATE "-fprofile-instr-generate" "-fcoverage-mapping") | ||||
|     else() | ||||
|         message(FATAL_ERROR "Coverage generation not supported for the ${CMAKE_CXX_COMPILER_ID} toolchain") | ||||
|     endif() | ||||
|   endif() | ||||
|   endif(COMPILER_IS_LIKE_GNU) | ||||
| 
 | ||||
|   if (MSVC) | ||||
|     # Specify /EHs for exception handling. | ||||
| @ -379,7 +383,6 @@ function(tint_default_compile_options TARGET) | ||||
|       ) | ||||
|     endif() | ||||
|   endif() | ||||
| 
 | ||||
| endfunction() | ||||
| 
 | ||||
| add_subdirectory(third_party) | ||||
|  | ||||
							
								
								
									
										4
									
								
								DEPS
									
									
									
									
									
								
							
							
						
						
									
										4
									
								
								DEPS
									
									
									
									
									
								
							| @ -10,6 +10,7 @@ vars = { | ||||
|   'chromium_git':  'https://chromium.googlesource.com', | ||||
|   'github': '/external/github.com', | ||||
| 
 | ||||
|   'benchmark_revision': 'e991355c02b93fe17713efe04cbc2e278e00fdbd', | ||||
|   'build_revision': '555c8b467c21e2c4b22d00e87e3faa0431df9ac2', | ||||
|   'buildtools_revision': 'f78b4b9f33bd8ef9944d5ce643daff1c31880189', | ||||
|   'catapult_revision': 'fa35beefb3429605035f98211ddb8750dee6a13d', | ||||
| @ -101,6 +102,9 @@ deps = { | ||||
|   'third_party/catapult': Var('chromium_git') + '/catapult.git@' + | ||||
|       Var('catapult_revision'), | ||||
| 
 | ||||
|   'third_party/benchmark': Var('chromium_git') + Var('github') + | ||||
|       '/google/benchmark.git@' + Var('benchmark_revision'), | ||||
| 
 | ||||
|   'third_party/googletest': Var('chromium_git') + Var('github') + | ||||
|       '/google/googletest.git@' + Var('googletest_revision'), | ||||
| 
 | ||||
|  | ||||
| @ -56,13 +56,7 @@ bool ReadFile(const std::string& input_file, std::vector<T>* buffer) { | ||||
|   } | ||||
| 
 | ||||
|   fseek(file, 0, SEEK_END); | ||||
|   auto tell_file_size = ftell(file); | ||||
|   if (tell_file_size <= 0) { | ||||
|     std::cerr << "Input file of incorrect size: " << input_file << std::endl; | ||||
|     fclose(file); | ||||
|     return {}; | ||||
|   } | ||||
|   const auto file_size = static_cast<size_t>(tell_file_size); | ||||
|   const auto file_size = static_cast<size_t>(ftell(file)); | ||||
|   if (0 != (file_size % sizeof(T))) { | ||||
|     std::cerr << "File " << input_file | ||||
|               << " does not contain an integral number of objects: " | ||||
|  | ||||
| @ -84,7 +84,8 @@ if [ "$BUILD_SYSTEM" == "cmake" ]; then | ||||
| 
 | ||||
|     COMMON_CMAKE_FLAGS="" | ||||
|     COMMON_CMAKE_FLAGS+=" -DCMAKE_BUILD_TYPE=${BUILD_TYPE}" | ||||
|     COMMON_CMAKE_FLAGS+=" -DTINT_DOCS_WARN_AS_ERROR=ON" | ||||
|     COMMON_CMAKE_FLAGS+=" -DTINT_DOCS_WARN_AS_ERROR=1" | ||||
|     COMMON_CMAKE_FLAGS+=" -DTINT_BUILD_BENCHMARKS=1" | ||||
| 
 | ||||
|     if [ "$BUILD_TOOLCHAIN" == "clang" ]; then | ||||
|         using clang-10.0.0 | ||||
| @ -155,9 +156,9 @@ if [ "$BUILD_SYSTEM" == "cmake" ]; then | ||||
| 
 | ||||
|     status "Checking disabling all readers and writers also builds" | ||||
|     show_cmds | ||||
|         cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=OFF -DTINT_BUILD_SPV_WRITER=OFF -DTINT_BUILD_WGSL_READER=OFF -DTINT_BUILD_WGSL_WRITER=OFF -DTINT_BUILD_MSL_WRITER=OFF -DTINT_BUILD_HLSL_WRITER=OFF | ||||
|         cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=OFF -DTINT_BUILD_SPV_WRITER=OFF -DTINT_BUILD_WGSL_READER=OFF -DTINT_BUILD_WGSL_WRITER=OFF -DTINT_BUILD_MSL_WRITER=OFF -DTINT_BUILD_HLSL_WRITER=OFF -DTINT_BUILD_BENCHMARKS=OFF | ||||
|         cmake --build . -- --jobs=$(nproc) | ||||
|         cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=ON -DTINT_BUILD_SPV_WRITER=ON -DTINT_BUILD_WGSL_READER=ON -DTINT_BUILD_WGSL_WRITER=ON -DTINT_BUILD_MSL_WRITER=ON -DTINT_BUILD_HLSL_WRITER=ON | ||||
|         cmake ${SRC_DIR} ${CMAKE_FLAGS} ${COMMON_CMAKE_FLAGS} -DTINT_BUILD_SPV_READER=ON -DTINT_BUILD_SPV_WRITER=ON -DTINT_BUILD_WGSL_READER=ON -DTINT_BUILD_WGSL_WRITER=ON -DTINT_BUILD_MSL_WRITER=ON -DTINT_BUILD_HLSL_WRITER=ON -DTINT_BUILD_BENCHMARKS=ON | ||||
|     hide_cmds | ||||
| else | ||||
|     status "Unsupported build system: $BUILD_SYSTEM" | ||||
|  | ||||
| @ -116,7 +116,7 @@ call :status "Configuring build system" | ||||
| @echo on | ||||
| mkdir %BUILD_DIR% | ||||
| cd /d %BUILD_DIR% | ||||
| set COMMON_CMAKE_FLAGS=-DTINT_BUILD_DOCS=O -DCMAKE_BUILD_TYPE=%BUILD_TYPE% | ||||
| set COMMON_CMAKE_FLAGS=-DTINT_BUILD_DOCS=O -DTINT_BUILD_BENCHMARKS=1 -DCMAKE_BUILD_TYPE=%BUILD_TYPE% | ||||
| @echo off | ||||
| 
 | ||||
| call :status "Building tint" | ||||
|  | ||||
| @ -437,13 +437,7 @@ bool ReadFile(const std::string& input_file, std::vector<T>* buffer) { | ||||
|   } | ||||
| 
 | ||||
|   fseek(file, 0, SEEK_END); | ||||
|   uint64_t tell_file_size = static_cast<uint64_t>(ftell(file)); | ||||
|   if (tell_file_size <= 0) { | ||||
|     std::cerr << "Input file of incorrect size: " << input_file << std::endl; | ||||
|     fclose(file); | ||||
|     return {}; | ||||
|   } | ||||
|   const auto file_size = static_cast<size_t>(tell_file_size); | ||||
|   const auto file_size = static_cast<size_t>(ftell(file)); | ||||
|   if (0 != (file_size % sizeof(T))) { | ||||
|     std::cerr << "File " << input_file | ||||
|               << " does not contain an integral number of objects: " | ||||
|  | ||||
| @ -598,7 +598,10 @@ if(${TINT_BUILD_SPV_READER} OR ${TINT_BUILD_SPV_WRITER}) | ||||
|   endif() | ||||
| endif() | ||||
| 
 | ||||
| if(${TINT_BUILD_TESTS}) | ||||
| ################################################################################ | ||||
| # Tests | ||||
| ################################################################################ | ||||
| if(TINT_BUILD_TESTS) | ||||
|   set(TINT_TEST_SRCS | ||||
|     ast/alias_test.cc | ||||
|     ast/array_test.cc | ||||
| @ -1114,6 +1117,7 @@ if(${TINT_BUILD_TESTS}) | ||||
|   endif() | ||||
| 
 | ||||
|   add_executable(tint_unittests ${TINT_TEST_SRCS}) | ||||
|   set_target_properties(${target} PROPERTIES FOLDER "Tests") | ||||
| 
 | ||||
|   if(NOT MSVC) | ||||
|     target_compile_options(tint_unittests PRIVATE | ||||
| @ -1133,4 +1137,41 @@ if(${TINT_BUILD_TESTS}) | ||||
|   endif() | ||||
| 
 | ||||
|   add_test(NAME tint_unittests COMMAND tint_unittests) | ||||
| endif() | ||||
| endif(TINT_BUILD_TESTS) | ||||
| 
 | ||||
| ################################################################################ | ||||
| # Benchmarks | ||||
| ################################################################################ | ||||
| if(TINT_BUILD_BENCHMARKS) | ||||
|   if(NOT TINT_BUILD_WGSL_READER) | ||||
|     message(FATAL_ERROR "TINT_BUILD_BENCHMARKS requires TINT_BUILD_WGSL_READER") | ||||
|   endif() | ||||
| 
 | ||||
|   set(TINT_BENCHMARK_SRC | ||||
|     "benchmark/benchmark.cc" | ||||
|     "reader/wgsl/parser_bench.cc" | ||||
|   ) | ||||
| 
 | ||||
|   if (${TINT_BUILD_GLSL_WRITER}) | ||||
|     list(APPEND TINT_BENCHMARK_SRC writer/glsl/generator_bench.cc) | ||||
|   endif() | ||||
|   if (${TINT_BUILD_HLSL_WRITER}) | ||||
|     list(APPEND TINT_BENCHMARK_SRC writer/hlsl/generator_bench.cc) | ||||
|   endif() | ||||
|   if (${TINT_BUILD_MSL_WRITER}) | ||||
|     list(APPEND TINT_BENCHMARK_SRC writer/msl/generator_bench.cc) | ||||
|   endif() | ||||
|   if (${TINT_BUILD_SPV_WRITER}) | ||||
|     list(APPEND TINT_BENCHMARK_SRC writer/spirv/generator_bench.cc) | ||||
|   endif() | ||||
|   if (${TINT_BUILD_WGSL_WRITER}) | ||||
|     list(APPEND TINT_BENCHMARK_SRC writer/wgsl/generator_bench.cc) | ||||
|   endif() | ||||
| 
 | ||||
|   add_executable(tint-benchmark ${TINT_BENCHMARK_SRC}) | ||||
|   set_target_properties(${target} PROPERTIES FOLDER "Benchmarks") | ||||
| 
 | ||||
|   tint_core_compile_options(tint-benchmark) | ||||
| 
 | ||||
|   target_link_libraries(tint-benchmark PRIVATE benchmark::benchmark libtint) | ||||
| endif(TINT_BUILD_BENCHMARKS) | ||||
|  | ||||
							
								
								
									
										123
									
								
								src/benchmark/benchmark.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										123
									
								
								src/benchmark/benchmark.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,123 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| #include <filesystem> | ||||
| #include <sstream> | ||||
| #include <utility> | ||||
| #include <vector> | ||||
| 
 | ||||
| namespace tint::benchmark { | ||||
| namespace { | ||||
| 
 | ||||
| std::filesystem::path kInputFileDir; | ||||
| 
 | ||||
| /// Copies the content from the file named `input_file` to `buffer`,
 | ||||
| /// assuming each element in the file is of type `T`.  If any error occurs,
 | ||||
| /// writes error messages to the standard error stream and returns false.
 | ||||
| /// Assumes the size of a `T` object is divisible by its required alignment.
 | ||||
| /// @returns true if we successfully read the file.
 | ||||
| template <typename T> | ||||
| std::variant<std::vector<T>, Error> ReadFile(const std::string& input_file) { | ||||
|   FILE* file = nullptr; | ||||
| #if defined(_MSC_VER) | ||||
|   fopen_s(&file, input_file.c_str(), "rb"); | ||||
| #else | ||||
|   file = fopen(input_file.c_str(), "rb"); | ||||
| #endif | ||||
|   if (!file) { | ||||
|     return Error{"Failed to open " + input_file}; | ||||
|   } | ||||
| 
 | ||||
|   fseek(file, 0, SEEK_END); | ||||
|   const auto file_size = static_cast<size_t>(ftell(file)); | ||||
|   if (0 != (file_size % sizeof(T))) { | ||||
|     std::stringstream err; | ||||
|     err << "File " << input_file | ||||
|         << " does not contain an integral number of objects: " << file_size | ||||
|         << " bytes in the file, require " << sizeof(T) << " bytes per object"; | ||||
|     fclose(file); | ||||
|     return Error{err.str()}; | ||||
|   } | ||||
|   fseek(file, 0, SEEK_SET); | ||||
| 
 | ||||
|   std::vector<T> buffer; | ||||
|   buffer.resize(file_size / sizeof(T)); | ||||
| 
 | ||||
|   size_t bytes_read = fread(buffer.data(), 1, file_size, file); | ||||
|   fclose(file); | ||||
|   if (bytes_read != file_size) { | ||||
|     return Error{"Failed to read " + input_file}; | ||||
|   } | ||||
| 
 | ||||
|   return buffer; | ||||
| } | ||||
| 
 | ||||
| bool FindBenchmarkInputDir() { | ||||
|   // Attempt to find the benchmark input files by searching up from the current
 | ||||
|   // working directory.
 | ||||
|   auto path = std::filesystem::current_path(); | ||||
|   while (std::filesystem::is_directory(path)) { | ||||
|     auto test = path / "test" / "benchmark"; | ||||
|     if (std::filesystem::is_directory(test)) { | ||||
|       kInputFileDir = test; | ||||
|       return true; | ||||
|     } | ||||
|     auto parent = path.parent_path(); | ||||
|     if (path == parent) { | ||||
|       break; | ||||
|     } | ||||
|     path = parent; | ||||
|   } | ||||
|   return false; | ||||
| } | ||||
| 
 | ||||
| }  // namespace
 | ||||
| 
 | ||||
| std::variant<tint::Source::File, Error> LoadInputFile(std::string name) { | ||||
|   auto path = (kInputFileDir / name).string(); | ||||
|   auto data = ReadFile<uint8_t>(path); | ||||
|   if (auto* buf = std::get_if<std::vector<uint8_t>>(&data)) { | ||||
|     return tint::Source::File(path, std::string(buf->begin(), buf->end())); | ||||
|   } | ||||
|   return std::get<Error>(data); | ||||
| } | ||||
| 
 | ||||
| std::variant<ProgramAndFile, Error> LoadProgram(std::string name) { | ||||
|   auto res = benchmark::LoadInputFile(name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     return *err; | ||||
|   } | ||||
|   auto& file = std::get<Source::File>(res); | ||||
|   auto program = reader::wgsl::Parse(&file); | ||||
|   if (program.Diagnostics().contains_errors()) { | ||||
|     return Error{program.Diagnostics().str()}; | ||||
|   } | ||||
|   return ProgramAndFile{std::move(program), std::move(file)}; | ||||
| } | ||||
| 
 | ||||
| }  // namespace tint::benchmark
 | ||||
| 
 | ||||
| int main(int argc, char** argv) { | ||||
|   ::benchmark::Initialize(&argc, argv); | ||||
|   if (::benchmark::ReportUnrecognizedArguments(argc, argv)) { | ||||
|     return 1; | ||||
|   } | ||||
|   if (!tint::benchmark::FindBenchmarkInputDir()) { | ||||
|     std::cerr << "failed to locate benchmark input files" << std::endl; | ||||
|     return 1; | ||||
|   } | ||||
|   ::benchmark::RunSpecifiedBenchmarks(); | ||||
| } | ||||
							
								
								
									
										69
									
								
								src/benchmark/benchmark.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										69
									
								
								src/benchmark/benchmark.h
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,69 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #ifndef SRC_BENCHMARK_BENCHMARK_H_ | ||||
| #define SRC_BENCHMARK_BENCHMARK_H_ | ||||
| 
 | ||||
| #include <memory> | ||||
| #include <string> | ||||
| #include <variant>  // NOLINT: Found C system header after C++ system header. | ||||
| 
 | ||||
| #include "benchmark/benchmark.h" | ||||
| #include "src/utils/concat.h" | ||||
| #include "tint/tint.h" | ||||
| 
 | ||||
| namespace tint::benchmark { | ||||
| 
 | ||||
| /// Error indicates an operation did not complete successfully.
 | ||||
| struct Error { | ||||
|   /// The error message.
 | ||||
|   std::string msg; | ||||
| }; | ||||
| 
 | ||||
| /// ProgramAndFile holds a Program and a Source::File.
 | ||||
| struct ProgramAndFile { | ||||
|   /// The tint program parsed from file.
 | ||||
|   Program program; | ||||
|   /// The source file
 | ||||
|   Source::File file; | ||||
| }; | ||||
| 
 | ||||
| /// LoadInputFile attempts to load a benchmark input file with the given file
 | ||||
| /// name.
 | ||||
| /// @param name the file name
 | ||||
| /// @returns either the loaded Source::File or an Error
 | ||||
| std::variant<Source::File, Error> LoadInputFile(std::string name); | ||||
| 
 | ||||
| /// LoadInputFile attempts to load a benchmark input program with the given file
 | ||||
| /// name.
 | ||||
| /// @param name the file name
 | ||||
| /// @returns either the loaded Program or an Error
 | ||||
| std::variant<ProgramAndFile, Error> LoadProgram(std::string name); | ||||
| 
 | ||||
| /// Declares a benchmark with the given function and WGSL file name
 | ||||
| #define TINT_BENCHMARK_WGSL_PROGRAM(FUNC, WGSL_NAME) \ | ||||
|   BENCHMARK_CAPTURE(FUNC, WGSL_NAME, WGSL_NAME); | ||||
| 
 | ||||
| /// Declares a set of benchmarks for the given function using a list of WGSL
 | ||||
| /// files in `<tint>/test/benchmark`.
 | ||||
| #define TINT_BENCHMARK_WGSL_PROGRAMS(FUNC)                   \ | ||||
|   TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "empty.wgsl");           \ | ||||
|   TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "particles.wgsl");       \ | ||||
|   TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_fragment.wgsl"); \ | ||||
|   TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_vertex.wgsl");   \ | ||||
|   TINT_BENCHMARK_WGSL_PROGRAM(FUNC, "simple_compute.wgsl"); | ||||
| 
 | ||||
| }  // namespace tint::benchmark
 | ||||
| 
 | ||||
| #endif  // SRC_BENCHMARK_BENCHMARK_H_
 | ||||
							
								
								
									
										40
									
								
								src/reader/wgsl/parser_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								src/reader/wgsl/parser_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,40 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::reader::wgsl { | ||||
| namespace { | ||||
| 
 | ||||
| void ParseWGSL(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadInputFile(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& file = std::get<Source::File>(res); | ||||
|   for (auto _ : state) { | ||||
|     auto res = Parse(&file); | ||||
|     if (res.Diagnostics().contains_errors()) { | ||||
|       state.SkipWithError(res.Diagnostics().str().c_str()); | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(ParseWGSL); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::reader::wgsl
 | ||||
							
								
								
									
										50
									
								
								src/writer/glsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										50
									
								
								src/writer/glsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,50 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/ast/module.h" | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::writer::glsl { | ||||
| namespace { | ||||
| 
 | ||||
| void GenerateGLSL(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadProgram(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& program = std::get<benchmark::ProgramAndFile>(res).program; | ||||
|   std::vector<std::string> entry_points; | ||||
|   for (auto& fn : program.AST().Functions()) { | ||||
|     if (fn->IsEntryPoint()) { | ||||
|       entry_points.emplace_back(program.Symbols().NameFor(fn->symbol)); | ||||
|     } | ||||
|   } | ||||
| 
 | ||||
|   for (auto _ : state) { | ||||
|     for (auto& ep : entry_points) { | ||||
|       auto res = Generate(&program, {}, ep); | ||||
|       if (!res.error.empty()) { | ||||
|         state.SkipWithError(res.error.c_str()); | ||||
|       } | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(GenerateGLSL); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::writer::glsl
 | ||||
							
								
								
									
										40
									
								
								src/writer/hlsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								src/writer/hlsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,40 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::writer::hlsl { | ||||
| namespace { | ||||
| 
 | ||||
| void GenerateHLSL(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadProgram(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& program = std::get<benchmark::ProgramAndFile>(res).program; | ||||
|   for (auto _ : state) { | ||||
|     auto res = Generate(&program, {}); | ||||
|     if (!res.error.empty()) { | ||||
|       state.SkipWithError(res.error.c_str()); | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(GenerateHLSL); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::writer::hlsl
 | ||||
							
								
								
									
										40
									
								
								src/writer/msl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								src/writer/msl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,40 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::writer::msl { | ||||
| namespace { | ||||
| 
 | ||||
| void GenerateMSL(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadProgram(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& program = std::get<benchmark::ProgramAndFile>(res).program; | ||||
|   for (auto _ : state) { | ||||
|     auto res = Generate(&program, {}); | ||||
|     if (!res.error.empty()) { | ||||
|       state.SkipWithError(res.error.c_str()); | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(GenerateMSL); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::writer::msl
 | ||||
							
								
								
									
										40
									
								
								src/writer/spirv/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								src/writer/spirv/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,40 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::writer::spirv { | ||||
| namespace { | ||||
| 
 | ||||
| void GenerateSPIRV(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadProgram(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& program = std::get<benchmark::ProgramAndFile>(res).program; | ||||
|   for (auto _ : state) { | ||||
|     auto res = Generate(&program, {}); | ||||
|     if (!res.error.empty()) { | ||||
|       state.SkipWithError(res.error.c_str()); | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(GenerateSPIRV); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::writer::spirv
 | ||||
							
								
								
									
										40
									
								
								src/writer/wgsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										40
									
								
								src/writer/wgsl/generator_bench.cc
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,40 @@ | ||||
| // Copyright 2022 The Tint Authors.
 | ||||
| //
 | ||||
| // Licensed under the Apache License, Version 2.0 (the "License");
 | ||||
| // you may not use this file except in compliance with the License.
 | ||||
| // You may obtain a copy of the License at
 | ||||
| //
 | ||||
| //     http://www.apache.org/licenses/LICENSE-2.0
 | ||||
| //
 | ||||
| // Unless required by applicable law or agreed to in writing, software
 | ||||
| // distributed under the License is distributed on an "AS IS" BASIS,
 | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 | ||||
| // See the License for the specific language governing permissions and
 | ||||
| // limitations under the License.
 | ||||
| 
 | ||||
| #include <string> | ||||
| 
 | ||||
| #include "src/benchmark/benchmark.h" | ||||
| 
 | ||||
| namespace tint::writer::wgsl { | ||||
| namespace { | ||||
| 
 | ||||
| void GenerateWGSL(::benchmark::State& state, std::string input_name) { | ||||
|   auto res = benchmark::LoadProgram(input_name); | ||||
|   if (auto err = std::get_if<benchmark::Error>(&res)) { | ||||
|     state.SkipWithError(err->msg.c_str()); | ||||
|     return; | ||||
|   } | ||||
|   auto& program = std::get<benchmark::ProgramAndFile>(res).program; | ||||
|   for (auto _ : state) { | ||||
|     auto res = Generate(&program, {}); | ||||
|     if (!res.error.empty()) { | ||||
|       state.SkipWithError(res.error.c_str()); | ||||
|     } | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| TINT_BENCHMARK_WGSL_PROGRAMS(GenerateWGSL); | ||||
| 
 | ||||
| }  // namespace
 | ||||
| }  // namespace tint::writer::wgsl
 | ||||
							
								
								
									
										0
									
								
								test/benchmark/empty.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										0
									
								
								test/benchmark/empty.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
								
								
									
										4
									
								
								test/benchmark/empty.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										4
									
								
								test/benchmark/empty.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,4 @@ | ||||
| [numthreads(1, 1, 1)] | ||||
| void unused_entry_point() { | ||||
|   return; | ||||
| } | ||||
							
								
								
									
										3
									
								
								test/benchmark/empty.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										3
									
								
								test/benchmark/empty.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,3 @@ | ||||
| #include <metal_stdlib> | ||||
| 
 | ||||
| using namespace metal; | ||||
							
								
								
									
										16
									
								
								test/benchmark/empty.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										16
									
								
								test/benchmark/empty.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,16 @@ | ||||
| ; SPIR-V | ||||
| ; Version: 1.3 | ||||
| ; Generator: Google Tint Compiler; 0 | ||||
| ; Bound: 5 | ||||
| ; Schema: 0 | ||||
|                OpCapability Shader | ||||
|                OpMemoryModel Logical GLSL450 | ||||
|                OpEntryPoint GLCompute %unused_entry_point "unused_entry_point" | ||||
|                OpExecutionMode %unused_entry_point LocalSize 1 1 1 | ||||
|                OpName %unused_entry_point "unused_entry_point" | ||||
|        %void = OpTypeVoid | ||||
|           %1 = OpTypeFunction %void | ||||
| %unused_entry_point = OpFunction %void None %1 | ||||
|           %4 = OpLabel | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
							
								
								
									
										0
									
								
								test/benchmark/empty.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										0
									
								
								test/benchmark/empty.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
								
								
									
										183
									
								
								test/benchmark/particles.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										183
									
								
								test/benchmark/particles.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,183 @@ | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // Utilities | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| var<private> rand_seed : vec2<f32>; | ||||
| 
 | ||||
| fn rand() -> f32 { | ||||
|     rand_seed.x = fract(cos(dot(rand_seed, vec2<f32>(23.14077926, 232.61690225))) * 136.8168); | ||||
|     rand_seed.y = fract(cos(dot(rand_seed, vec2<f32>(54.47856553, 345.84153136))) * 534.7645); | ||||
|     return rand_seed.y; | ||||
| } | ||||
| 
 | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // Vertex shader | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| struct RenderParams { | ||||
|   modelViewProjectionMatrix : mat4x4<f32>; | ||||
|   right : vec3<f32>; | ||||
|   up    : vec3<f32>; | ||||
| }; | ||||
| [[binding(0), group(0)]] var<uniform> render_params : RenderParams; | ||||
| 
 | ||||
| struct VertexInput { | ||||
|   [[location(0)]] position : vec3<f32>; | ||||
|   [[location(1)]] color    : vec4<f32>; | ||||
|   [[location(2)]] quad_pos : vec2<f32>; // -1..+1 | ||||
| }; | ||||
| 
 | ||||
| struct VertexOutput { | ||||
|   [[builtin(position)]] position : vec4<f32>; | ||||
|   [[location(0)]]       color    : vec4<f32>; | ||||
|   [[location(1)]]       quad_pos : vec2<f32>; // -1..+1 | ||||
| }; | ||||
| 
 | ||||
| [[stage(vertex)]] | ||||
| fn vs_main(in : VertexInput) -> VertexOutput { | ||||
|   var quad_pos = mat2x3<f32>(render_params.right, render_params.up) * in.quad_pos; | ||||
|   var position = in.position + quad_pos * 0.01; | ||||
|   var out : VertexOutput; | ||||
|   out.position = render_params.modelViewProjectionMatrix * vec4<f32>(position, 1.0); | ||||
|   out.color = in.color; | ||||
|   out.quad_pos = in.quad_pos; | ||||
|   return out; | ||||
| } | ||||
| 
 | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // Fragment shader | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| [[stage(fragment)]] | ||||
| fn fs_main(in : VertexOutput) -> [[location(0)]] vec4<f32> { | ||||
|   var color = in.color; | ||||
|   // Apply a circular particle alpha mask | ||||
|   color.a = color.a * max(1.0 - length(in.quad_pos), 0.0); | ||||
|   return color; | ||||
| } | ||||
| 
 | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // Simulation Compute shader | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| struct SimulationParams { | ||||
|   deltaTime : f32; | ||||
|   seed : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Particle { | ||||
|   position : vec3<f32>; | ||||
|   lifetime : f32; | ||||
|   color    : vec4<f32>; | ||||
|   velocity : vec3<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Particles { | ||||
|   particles : array<Particle>; | ||||
| }; | ||||
| 
 | ||||
| [[binding(0), group(0)]] var<uniform> sim_params : SimulationParams; | ||||
| [[binding(1), group(0)]] var<storage, read_write> data : Particles; | ||||
| [[binding(2), group(0)]] var texture : texture_2d<f32>; | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn simulate([[builtin(global_invocation_id)]] GlobalInvocationID : vec3<u32>) { | ||||
|   rand_seed = (sim_params.seed.xy + vec2<f32>(GlobalInvocationID.xy)) * sim_params.seed.zw; | ||||
| 
 | ||||
|   let idx = GlobalInvocationID.x; | ||||
|   var particle = data.particles[idx]; | ||||
| 
 | ||||
|   // Apply gravity | ||||
|   particle.velocity.z = particle.velocity.z - sim_params.deltaTime * 0.5; | ||||
| 
 | ||||
|   // Basic velocity integration | ||||
|   particle.position = particle.position + sim_params.deltaTime * particle.velocity; | ||||
| 
 | ||||
|   // Age each particle. Fade out before vanishing. | ||||
|   particle.lifetime = particle.lifetime - sim_params.deltaTime; | ||||
|   particle.color.a = smoothStep(0.0, 0.5, particle.lifetime); | ||||
| 
 | ||||
|   // If the lifetime has gone negative, then the particle is dead and should be | ||||
|   // respawned. | ||||
|   if (particle.lifetime < 0.0) { | ||||
|     // Use the probability map to find where the particle should be spawned. | ||||
|     // Starting with the 1x1 mip level. | ||||
|     var coord = vec2<i32>(0, 0); | ||||
|     for (var level = textureNumLevels(texture) - 1; level > 0; level = level - 1) { | ||||
|       // Load the probability value from the mip-level | ||||
|       // Generate a random number and using the probabilty values, pick the | ||||
|       // next texel in the next largest mip level: | ||||
|       // | ||||
|       // 0.0    probabilites.r    probabilites.g    probabilites.b   1.0 | ||||
|       //  |              |              |              |              | | ||||
|       //  |   TOP-LEFT   |  TOP-RIGHT   | BOTTOM-LEFT  | BOTTOM_RIGHT | | ||||
|       // | ||||
|       let probabilites = textureLoad(texture, coord, level); | ||||
|       let value = vec4<f32>(rand()); | ||||
|       let mask = (value >= vec4<f32>(0.0, probabilites.xyz)) & (value < probabilites); | ||||
|       coord = coord * 2; | ||||
|       coord.x = coord.x + select(0, 1, any(mask.yw)); // x  y | ||||
|       coord.y = coord.y + select(0, 1, any(mask.zw)); // z  w | ||||
|     } | ||||
|     let uv = vec2<f32>(coord) / vec2<f32>(textureDimensions(texture)); | ||||
|     particle.position = vec3<f32>((uv - 0.5) * 3.0 * vec2<f32>(1.0, -1.0), 0.0); | ||||
|     particle.color = textureLoad(texture, coord, 0); | ||||
|     particle.velocity.x = (rand() - 0.5) * 0.1; | ||||
|     particle.velocity.y = (rand() - 0.5) * 0.1; | ||||
|     particle.velocity.z = rand() * 0.3; | ||||
|     particle.lifetime = 0.5 + rand() * 2.0; | ||||
|   } | ||||
| 
 | ||||
|   // Store the new particle value | ||||
|   data.particles[idx] = particle; | ||||
| } | ||||
| 
 | ||||
| struct UBO { | ||||
|   width : u32; | ||||
| }; | ||||
| 
 | ||||
| struct Buffer { | ||||
|   weights : array<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[binding(3), group(0)]] var<uniform> ubo : UBO; | ||||
| [[binding(4), group(0)]] var<storage, read> buf_in : Buffer; | ||||
| [[binding(5), group(0)]] var<storage, read_write> buf_out : Buffer; | ||||
| [[binding(6), group(0)]] var tex_in : texture_2d<f32>; | ||||
| [[binding(7), group(0)]] var tex_out : texture_storage_2d<rgba8unorm, write>; | ||||
| 
 | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // import_level | ||||
| // | ||||
| // Loads the alpha channel from a texel of the source image, and writes it to | ||||
| // the buf_out.weights. | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn import_level([[builtin(global_invocation_id)]] coord : vec3<u32>) { | ||||
|   _ = &buf_in; | ||||
|   let offset = coord.x + coord.y * ubo.width; | ||||
|   buf_out.weights[offset] = textureLoad(tex_in, vec2<i32>(coord.xy), 0).w; | ||||
| } | ||||
| 
 | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| // export_level | ||||
| // | ||||
| // Loads 4 f32 weight values from buf_in.weights, and stores summed value into | ||||
| // buf_out.weights, along with the calculated 'probabilty' vec4 values into the | ||||
| // mip level of tex_out. See simulate() in particle.wgsl to understand the | ||||
| // probability logic. | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn export_level([[builtin(global_invocation_id)]] coord : vec3<u32>) { | ||||
|   if (all(coord.xy < vec2<u32>(textureDimensions(tex_out)))) { | ||||
|     let dst_offset = coord.x    + coord.y    * ubo.width; | ||||
|     let src_offset = coord.x*2u + coord.y*2u * ubo.width; | ||||
| 
 | ||||
|     let a = buf_in.weights[src_offset + 0u]; | ||||
|     let b = buf_in.weights[src_offset + 1u]; | ||||
|     let c = buf_in.weights[src_offset + 0u + ubo.width]; | ||||
|     let d = buf_in.weights[src_offset + 1u + ubo.width]; | ||||
|     let sum = dot(vec4<f32>(a, b, c, d), vec4<f32>(1.0)); | ||||
| 
 | ||||
|     buf_out.weights[dst_offset] = sum / 4.0; | ||||
| 
 | ||||
|     let probabilities = vec4<f32>(a, a+b, a+b+c, sum) / max(sum, 0.0001); | ||||
|     textureStore(tex_out, vec2<i32>(coord.xy), probabilities); | ||||
|   } | ||||
| } | ||||
							
								
								
									
										204
									
								
								test/benchmark/particles.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										204
									
								
								test/benchmark/particles.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,204 @@ | ||||
| static float2 rand_seed = float2(0.0f, 0.0f); | ||||
| 
 | ||||
| float rand() { | ||||
|   rand_seed.x = frac((cos(dot(rand_seed, float2(23.140779495f, 232.616897583f))) * 136.816802979f)); | ||||
|   rand_seed.y = frac((cos(dot(rand_seed, float2(54.478565216f, 345.841522217f))) * 534.764526367f)); | ||||
|   return rand_seed.y; | ||||
| } | ||||
| 
 | ||||
| cbuffer cbuffer_render_params : register(b0, space0) { | ||||
|   uint4 render_params[6]; | ||||
| }; | ||||
| 
 | ||||
| struct VertexInput { | ||||
|   float3 position; | ||||
|   float4 color; | ||||
|   float2 quad_pos; | ||||
| }; | ||||
| struct VertexOutput { | ||||
|   float4 position; | ||||
|   float4 color; | ||||
|   float2 quad_pos; | ||||
| }; | ||||
| struct tint_symbol_5 { | ||||
|   float3 position : TEXCOORD0; | ||||
|   float4 color : TEXCOORD1; | ||||
|   float2 quad_pos : TEXCOORD2; | ||||
| }; | ||||
| struct tint_symbol_6 { | ||||
|   float4 color : TEXCOORD0; | ||||
|   float2 quad_pos : TEXCOORD1; | ||||
|   float4 position : SV_Position; | ||||
| }; | ||||
| 
 | ||||
| float4x4 tint_symbol_17(uint4 buffer[6], uint offset) { | ||||
|   const uint scalar_offset = ((offset + 0u)) / 4; | ||||
|   const uint scalar_offset_1 = ((offset + 16u)) / 4; | ||||
|   const uint scalar_offset_2 = ((offset + 32u)) / 4; | ||||
|   const uint scalar_offset_3 = ((offset + 48u)) / 4; | ||||
|   return float4x4(asfloat(buffer[scalar_offset / 4]), asfloat(buffer[scalar_offset_1 / 4]), asfloat(buffer[scalar_offset_2 / 4]), asfloat(buffer[scalar_offset_3 / 4])); | ||||
| } | ||||
| 
 | ||||
| VertexOutput vs_main_inner(VertexInput tint_symbol) { | ||||
|   float3 quad_pos = mul(tint_symbol.quad_pos, float2x3(asfloat(render_params[4].xyz), asfloat(render_params[5].xyz))); | ||||
|   float3 position = (tint_symbol.position + (quad_pos * 0.01f)); | ||||
|   VertexOutput tint_symbol_1 = (VertexOutput)0; | ||||
|   tint_symbol_1.position = mul(float4(position, 1.0f), tint_symbol_17(render_params, 0u)); | ||||
|   tint_symbol_1.color = tint_symbol.color; | ||||
|   tint_symbol_1.quad_pos = tint_symbol.quad_pos; | ||||
|   return tint_symbol_1; | ||||
| } | ||||
| 
 | ||||
| tint_symbol_6 vs_main(tint_symbol_5 tint_symbol_4) { | ||||
|   const VertexInput tint_symbol_32 = {tint_symbol_4.position, tint_symbol_4.color, tint_symbol_4.quad_pos}; | ||||
|   const VertexOutput inner_result = vs_main_inner(tint_symbol_32); | ||||
|   tint_symbol_6 wrapper_result = (tint_symbol_6)0; | ||||
|   wrapper_result.position = inner_result.position; | ||||
|   wrapper_result.color = inner_result.color; | ||||
|   wrapper_result.quad_pos = inner_result.quad_pos; | ||||
|   return wrapper_result; | ||||
| } | ||||
| 
 | ||||
| struct tint_symbol_8 { | ||||
|   float4 color : TEXCOORD0; | ||||
|   float2 quad_pos : TEXCOORD1; | ||||
|   float4 position : SV_Position; | ||||
| }; | ||||
| struct tint_symbol_9 { | ||||
|   float4 value : SV_Target0; | ||||
| }; | ||||
| 
 | ||||
| float4 fs_main_inner(VertexOutput tint_symbol) { | ||||
|   float4 color = tint_symbol.color; | ||||
|   color.a = (color.a * max((1.0f - length(tint_symbol.quad_pos)), 0.0f)); | ||||
|   return color; | ||||
| } | ||||
| 
 | ||||
| tint_symbol_9 fs_main(tint_symbol_8 tint_symbol_7) { | ||||
|   const VertexOutput tint_symbol_33 = {tint_symbol_7.position, tint_symbol_7.color, tint_symbol_7.quad_pos}; | ||||
|   const float4 inner_result_1 = fs_main_inner(tint_symbol_33); | ||||
|   tint_symbol_9 wrapper_result_1 = (tint_symbol_9)0; | ||||
|   wrapper_result_1.value = inner_result_1; | ||||
|   return wrapper_result_1; | ||||
| } | ||||
| 
 | ||||
| struct Particle { | ||||
|   float3 position; | ||||
|   float lifetime; | ||||
|   float4 color; | ||||
|   float3 velocity; | ||||
| }; | ||||
| 
 | ||||
| cbuffer cbuffer_sim_params : register(b0, space0) { | ||||
|   uint4 sim_params[2]; | ||||
| }; | ||||
| RWByteAddressBuffer data : register(u1, space0); | ||||
| Texture2D<float4> tint_symbol_2 : register(t2, space0); | ||||
| 
 | ||||
| struct tint_symbol_11 { | ||||
|   uint3 GlobalInvocationID : SV_DispatchThreadID; | ||||
| }; | ||||
| 
 | ||||
| Particle tint_symbol_20(RWByteAddressBuffer buffer, uint offset) { | ||||
|   const Particle tint_symbol_34 = {asfloat(buffer.Load3((offset + 0u))), asfloat(buffer.Load((offset + 12u))), asfloat(buffer.Load4((offset + 16u))), asfloat(buffer.Load3((offset + 32u)))}; | ||||
|   return tint_symbol_34; | ||||
| } | ||||
| 
 | ||||
| void tint_symbol_25(RWByteAddressBuffer buffer, uint offset, Particle value) { | ||||
|   buffer.Store3((offset + 0u), asuint(value.position)); | ||||
|   buffer.Store((offset + 12u), asuint(value.lifetime)); | ||||
|   buffer.Store4((offset + 16u), asuint(value.color)); | ||||
|   buffer.Store3((offset + 32u), asuint(value.velocity)); | ||||
| } | ||||
| 
 | ||||
| void simulate_inner(uint3 GlobalInvocationID) { | ||||
|   rand_seed = ((asfloat(sim_params[1]).xy + float2(GlobalInvocationID.xy)) * asfloat(sim_params[1]).zw); | ||||
|   const uint idx = GlobalInvocationID.x; | ||||
|   Particle particle = tint_symbol_20(data, (48u * idx)); | ||||
|   particle.velocity.z = (particle.velocity.z - (asfloat(sim_params[0].x) * 0.5f)); | ||||
|   particle.position = (particle.position + (asfloat(sim_params[0].x) * particle.velocity)); | ||||
|   particle.lifetime = (particle.lifetime - asfloat(sim_params[0].x)); | ||||
|   particle.color.a = smoothstep(0.0f, 0.5f, particle.lifetime); | ||||
|   if ((particle.lifetime < 0.0f)) { | ||||
|     int2 coord = int2(0, 0); | ||||
|     { | ||||
|       int3 tint_tmp; | ||||
|       tint_symbol_2.GetDimensions(0, tint_tmp.x, tint_tmp.y, tint_tmp.z); | ||||
|       int level = (tint_tmp.z - 1); | ||||
|       [loop] for(; (level > 0); level = (level - 1)) { | ||||
|         const float4 probabilites = tint_symbol_2.Load(int3(coord, level)); | ||||
|         const float4 value = float4((rand()).xxxx); | ||||
|         const bool4 mask = ((value >= float4(0.0f, probabilites.xyz)) & (value < probabilites)); | ||||
|         coord = (coord * 2); | ||||
|         coord.x = (coord.x + (any(mask.yw) ? 1 : 0)); | ||||
|         coord.y = (coord.y + (any(mask.zw) ? 1 : 0)); | ||||
|       } | ||||
|     } | ||||
|     int2 tint_tmp_1; | ||||
|     tint_symbol_2.GetDimensions(tint_tmp_1.x, tint_tmp_1.y); | ||||
|     const float2 uv = (float2(coord) / float2(tint_tmp_1)); | ||||
|     particle.position = float3((((uv - 0.5f) * 3.0f) * float2(1.0f, -1.0f)), 0.0f); | ||||
|     particle.color = tint_symbol_2.Load(int3(coord, 0)); | ||||
|     particle.velocity.x = ((rand() - 0.5f) * 0.100000001f); | ||||
|     particle.velocity.y = ((rand() - 0.5f) * 0.100000001f); | ||||
|     particle.velocity.z = (rand() * 0.300000012f); | ||||
|     particle.lifetime = (0.5f + (rand() * 2.0f)); | ||||
|   } | ||||
|   tint_symbol_25(data, (48u * idx), particle); | ||||
| } | ||||
| 
 | ||||
| [numthreads(64, 1, 1)] | ||||
| void simulate(tint_symbol_11 tint_symbol_10) { | ||||
|   simulate_inner(tint_symbol_10.GlobalInvocationID); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
| cbuffer cbuffer_ubo : register(b3, space0) { | ||||
|   uint4 ubo[1]; | ||||
| }; | ||||
| ByteAddressBuffer buf_in : register(t4, space0); | ||||
| RWByteAddressBuffer buf_out : register(u5, space0); | ||||
| Texture2D<float4> tex_in : register(t6, space0); | ||||
| RWTexture2D<float4> tex_out : register(u7, space0); | ||||
| 
 | ||||
| struct tint_symbol_13 { | ||||
|   uint3 coord : SV_DispatchThreadID; | ||||
| }; | ||||
| 
 | ||||
| void import_level_inner(uint3 coord) { | ||||
|   const uint offset = (coord.x + (coord.y * ubo[0].x)); | ||||
|   buf_out.Store((4u * offset), asuint(tex_in.Load(int3(int2(coord.xy), 0)).w)); | ||||
| } | ||||
| 
 | ||||
| [numthreads(64, 1, 1)] | ||||
| void import_level(tint_symbol_13 tint_symbol_12) { | ||||
|   import_level_inner(tint_symbol_12.coord); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
| struct tint_symbol_15 { | ||||
|   uint3 coord : SV_DispatchThreadID; | ||||
| }; | ||||
| 
 | ||||
| void export_level_inner(uint3 coord) { | ||||
|   int2 tint_tmp_2; | ||||
|   tex_out.GetDimensions(tint_tmp_2.x, tint_tmp_2.y); | ||||
|   if (all((coord.xy < uint2(tint_tmp_2)))) { | ||||
|     const uint dst_offset = (coord.x + (coord.y * ubo[0].x)); | ||||
|     const uint src_offset = ((coord.x * 2u) + ((coord.y * 2u) * ubo[0].x)); | ||||
|     const float a_1 = asfloat(buf_in.Load((4u * (src_offset + 0u)))); | ||||
|     const float b = asfloat(buf_in.Load((4u * (src_offset + 1u)))); | ||||
|     const float c = asfloat(buf_in.Load((4u * ((src_offset + 0u) + ubo[0].x)))); | ||||
|     const float d = asfloat(buf_in.Load((4u * ((src_offset + 1u) + ubo[0].x)))); | ||||
|     const float sum = dot(float4(a_1, b, c, d), float4((1.0f).xxxx)); | ||||
|     buf_out.Store((4u * dst_offset), asuint((sum / 4.0f))); | ||||
|     const float4 probabilities = (float4(a_1, (a_1 + b), ((a_1 + b) + c), sum) / max(sum, 0.0001f)); | ||||
|     tex_out[int2(coord.xy)] = probabilities; | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| [numthreads(64, 1, 1)] | ||||
| void export_level(tint_symbol_15 tint_symbol_14) { | ||||
|   export_level_inner(tint_symbol_14.coord); | ||||
|   return; | ||||
| } | ||||
							
								
								
									
										175
									
								
								test/benchmark/particles.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										175
									
								
								test/benchmark/particles.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,175 @@ | ||||
| #include <metal_stdlib> | ||||
| 
 | ||||
| using namespace metal; | ||||
| 
 | ||||
| template<typename T, int N, int M> | ||||
| inline vec<T, M> operator*(matrix<T, N, M> lhs, packed_vec<T, N> rhs) { | ||||
|   return lhs * vec<T, N>(rhs); | ||||
| } | ||||
| 
 | ||||
| template<typename T, int N, int M> | ||||
| inline vec<T, N> operator*(packed_vec<T, M> lhs, matrix<T, N, M> rhs) { | ||||
|   return vec<T, M>(lhs) * rhs; | ||||
| } | ||||
| 
 | ||||
| struct RenderParams { | ||||
|   /* 0x0000 */ float4x4 modelViewProjectionMatrix; | ||||
|   /* 0x0040 */ packed_float3 right; | ||||
|   /* 0x004c */ int8_t tint_pad[4]; | ||||
|   /* 0x0050 */ packed_float3 up; | ||||
|   /* 0x005c */ int8_t tint_pad_1[4]; | ||||
| }; | ||||
| struct VertexInput { | ||||
|   float3 position; | ||||
|   float4 color; | ||||
|   float2 quad_pos; | ||||
| }; | ||||
| struct VertexOutput { | ||||
|   float4 position; | ||||
|   float4 color; | ||||
|   float2 quad_pos; | ||||
| }; | ||||
| struct tint_symbol_2 { | ||||
|   float3 position [[attribute(0)]]; | ||||
|   float4 color [[attribute(1)]]; | ||||
|   float2 quad_pos [[attribute(2)]]; | ||||
| }; | ||||
| struct tint_symbol_3 { | ||||
|   float4 color [[user(locn0)]]; | ||||
|   float2 quad_pos [[user(locn1)]]; | ||||
|   float4 position [[position]]; | ||||
| }; | ||||
| struct tint_symbol_5 { | ||||
|   float4 color [[user(locn0)]]; | ||||
|   float2 quad_pos [[user(locn1)]]; | ||||
| }; | ||||
| struct tint_symbol_6 { | ||||
|   float4 value [[color(0)]]; | ||||
| }; | ||||
| struct SimulationParams { | ||||
|   /* 0x0000 */ float deltaTime; | ||||
|   /* 0x0004 */ int8_t tint_pad_2[12]; | ||||
|   /* 0x0010 */ float4 seed; | ||||
| }; | ||||
| struct Particle { | ||||
|   /* 0x0000 */ packed_float3 position; | ||||
|   /* 0x000c */ float lifetime; | ||||
|   /* 0x0010 */ float4 color; | ||||
|   /* 0x0020 */ packed_float3 velocity; | ||||
|   /* 0x002c */ int8_t tint_pad_3[4]; | ||||
| }; | ||||
| struct Particles { | ||||
|   /* 0x0000 */ Particle particles[1]; | ||||
| }; | ||||
| struct UBO { | ||||
|   /* 0x0000 */ uint width; | ||||
| }; | ||||
| struct Buffer { | ||||
|   /* 0x0000 */ float weights[1]; | ||||
| }; | ||||
| 
 | ||||
| float rand(thread float2* const tint_symbol_9) { | ||||
|   (*(tint_symbol_9))[0] = fract((cos(dot(*(tint_symbol_9), float2(23.140779495f, 232.616897583f))) * 136.816802979f)); | ||||
|   (*(tint_symbol_9))[1] = fract((cos(dot(*(tint_symbol_9), float2(54.478565216f, 345.841522217f))) * 534.764526367f)); | ||||
|   return (*(tint_symbol_9))[1]; | ||||
| } | ||||
| 
 | ||||
| VertexOutput vs_main_inner(VertexInput in, const constant RenderParams* const tint_symbol_10) { | ||||
|   float3 quad_pos = (float2x3((*(tint_symbol_10)).right, (*(tint_symbol_10)).up) * in.quad_pos); | ||||
|   float3 position = (in.position + (quad_pos * 0.01f)); | ||||
|   VertexOutput out = {}; | ||||
|   out.position = ((*(tint_symbol_10)).modelViewProjectionMatrix * float4(position, 1.0f)); | ||||
|   out.color = in.color; | ||||
|   out.quad_pos = in.quad_pos; | ||||
|   return out; | ||||
| } | ||||
| 
 | ||||
| vertex tint_symbol_3 vs_main(const constant RenderParams* tint_symbol_11 [[buffer(0)]], tint_symbol_2 tint_symbol_1 [[stage_in]]) { | ||||
|   VertexInput const tint_symbol_7 = {.position=tint_symbol_1.position, .color=tint_symbol_1.color, .quad_pos=tint_symbol_1.quad_pos}; | ||||
|   VertexOutput const inner_result = vs_main_inner(tint_symbol_7, tint_symbol_11); | ||||
|   tint_symbol_3 wrapper_result = {}; | ||||
|   wrapper_result.position = inner_result.position; | ||||
|   wrapper_result.color = inner_result.color; | ||||
|   wrapper_result.quad_pos = inner_result.quad_pos; | ||||
|   return wrapper_result; | ||||
| } | ||||
| 
 | ||||
| float4 fs_main_inner(VertexOutput in) { | ||||
|   float4 color = in.color; | ||||
|   color[3] = (color[3] * fmax((1.0f - length(in.quad_pos)), 0.0f)); | ||||
|   return color; | ||||
| } | ||||
| 
 | ||||
| fragment tint_symbol_6 fs_main(float4 position [[position]], tint_symbol_5 tint_symbol_4 [[stage_in]]) { | ||||
|   VertexOutput const tint_symbol_8 = {.position=position, .color=tint_symbol_4.color, .quad_pos=tint_symbol_4.quad_pos}; | ||||
|   float4 const inner_result_1 = fs_main_inner(tint_symbol_8); | ||||
|   tint_symbol_6 wrapper_result_1 = {}; | ||||
|   wrapper_result_1.value = inner_result_1; | ||||
|   return wrapper_result_1; | ||||
| } | ||||
| 
 | ||||
| void simulate_inner(uint3 GlobalInvocationID, thread float2* const tint_symbol_12, const constant SimulationParams* const tint_symbol_13, device Particles* const tint_symbol_14, texture2d<float, access::sample> tint_symbol_15) { | ||||
|   *(tint_symbol_12) = ((float4((*(tint_symbol_13)).seed).xy + float2(uint3(GlobalInvocationID).xy)) * float4((*(tint_symbol_13)).seed).zw); | ||||
|   uint const idx = GlobalInvocationID[0]; | ||||
|   Particle particle = (*(tint_symbol_14)).particles[idx]; | ||||
|   particle.velocity[2] = (particle.velocity[2] - ((*(tint_symbol_13)).deltaTime * 0.5f)); | ||||
|   particle.position = (particle.position + ((*(tint_symbol_13)).deltaTime * particle.velocity)); | ||||
|   particle.lifetime = (particle.lifetime - (*(tint_symbol_13)).deltaTime); | ||||
|   particle.color[3] = smoothstep(0.0f, 0.5f, particle.lifetime); | ||||
|   if ((particle.lifetime < 0.0f)) { | ||||
|     int2 coord = int2(0, 0); | ||||
|     for(int level = as_type<int>((as_type<uint>(int(tint_symbol_15.get_num_mip_levels())) - as_type<uint>(1))); (level > 0); level = as_type<int>((as_type<uint>(level) - as_type<uint>(1)))) { | ||||
|       float4 const probabilites = tint_symbol_15.read(uint2(coord), level); | ||||
|       float4 const value = float4(rand(tint_symbol_12)); | ||||
|       bool4 const mask = ((value >= float4(0.0f, float4(probabilites).xyz)) & (value < probabilites)); | ||||
|       coord = as_type<int2>((as_type<uint2>(coord) * as_type<uint>(2))); | ||||
|       coord[0] = as_type<int>((as_type<uint>(coord[0]) + as_type<uint>(select(0, 1, any(bool4(mask).yw))))); | ||||
|       coord[1] = as_type<int>((as_type<uint>(coord[1]) + as_type<uint>(select(0, 1, any(bool4(mask).zw))))); | ||||
|     } | ||||
|     float2 const uv = (float2(coord) / float2(int2(tint_symbol_15.get_width(), tint_symbol_15.get_height()))); | ||||
|     particle.position = float3((((uv - 0.5f) * 3.0f) * float2(1.0f, -1.0f)), 0.0f); | ||||
|     particle.color = tint_symbol_15.read(uint2(coord), 0); | ||||
|     particle.velocity[0] = ((rand(tint_symbol_12) - 0.5f) * 0.100000001f); | ||||
|     particle.velocity[1] = ((rand(tint_symbol_12) - 0.5f) * 0.100000001f); | ||||
|     particle.velocity[2] = (rand(tint_symbol_12) * 0.300000012f); | ||||
|     particle.lifetime = (0.5f + (rand(tint_symbol_12) * 2.0f)); | ||||
|   } | ||||
|   (*(tint_symbol_14)).particles[idx] = particle; | ||||
| } | ||||
| 
 | ||||
| kernel void simulate(const constant SimulationParams* tint_symbol_17 [[buffer(0)]], device Particles* tint_symbol_18 [[buffer(1)]], texture2d<float, access::sample> tint_symbol_19 [[texture(0)]], uint3 GlobalInvocationID [[thread_position_in_grid]]) { | ||||
|   thread float2 tint_symbol_16 = 0.0f; | ||||
|   simulate_inner(GlobalInvocationID, &(tint_symbol_16), tint_symbol_17, tint_symbol_18, tint_symbol_19); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
| void import_level_inner(uint3 coord, const constant UBO* const tint_symbol_20, device Buffer* const tint_symbol_21, texture2d<float, access::sample> tint_symbol_22) { | ||||
|   uint const offset = (coord[0] + (coord[1] * (*(tint_symbol_20)).width)); | ||||
|   (*(tint_symbol_21)).weights[offset] = tint_symbol_22.read(uint2(int2(uint3(coord).xy)), 0)[3]; | ||||
| } | ||||
| 
 | ||||
| kernel void import_level(const constant UBO* tint_symbol_23 [[buffer(2)]], device Buffer* tint_symbol_24 [[buffer(3)]], texture2d<float, access::sample> tint_symbol_25 [[texture(1)]], uint3 coord [[thread_position_in_grid]]) { | ||||
|   import_level_inner(coord, tint_symbol_23, tint_symbol_24, tint_symbol_25); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
| void export_level_inner(uint3 coord, texture2d<float, access::write> tint_symbol_26, const constant UBO* const tint_symbol_27, const device Buffer* const tint_symbol_28, device Buffer* const tint_symbol_29) { | ||||
|   if (all((uint3(coord).xy < uint2(int2(tint_symbol_26.get_width(), tint_symbol_26.get_height()))))) { | ||||
|     uint const dst_offset = (coord[0] + (coord[1] * (*(tint_symbol_27)).width)); | ||||
|     uint const src_offset = ((coord[0] * 2u) + ((coord[1] * 2u) * (*(tint_symbol_27)).width)); | ||||
|     float const a_1 = (*(tint_symbol_28)).weights[(src_offset + 0u)]; | ||||
|     float const b = (*(tint_symbol_28)).weights[(src_offset + 1u)]; | ||||
|     float const c = (*(tint_symbol_28)).weights[((src_offset + 0u) + (*(tint_symbol_27)).width)]; | ||||
|     float const d = (*(tint_symbol_28)).weights[((src_offset + 1u) + (*(tint_symbol_27)).width)]; | ||||
|     float const sum = dot(float4(a_1, b, c, d), float4(1.0f)); | ||||
|     (*(tint_symbol_29)).weights[dst_offset] = (sum / 4.0f); | ||||
|     float4 const probabilities = (float4(a_1, (a_1 + b), ((a_1 + b) + c), sum) / fmax(sum, 0.0001f)); | ||||
|     tint_symbol_26.write(probabilities, uint2(int2(uint3(coord).xy))); | ||||
|   } | ||||
| } | ||||
| 
 | ||||
| kernel void export_level(texture2d<float, access::write> tint_symbol_30 [[texture(2)]], const constant UBO* tint_symbol_31 [[buffer(2)]], const device Buffer* tint_symbol_32 [[buffer(4)]], device Buffer* tint_symbol_33 [[buffer(3)]], uint3 coord [[thread_position_in_grid]]) { | ||||
|   export_level_inner(coord, tint_symbol_30, tint_symbol_31, tint_symbol_32, tint_symbol_33); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
							
								
								
									
										646
									
								
								test/benchmark/particles.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										646
									
								
								test/benchmark/particles.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,646 @@ | ||||
| ; SPIR-V | ||||
| ; Version: 1.3 | ||||
| ; Generator: Google Tint Compiler; 0 | ||||
| ; Bound: 423 | ||||
| ; Schema: 0 | ||||
|                OpCapability Shader | ||||
|                OpCapability ImageQuery | ||||
|          %67 = OpExtInstImport "GLSL.std.450" | ||||
|                OpMemoryModel Logical GLSL450 | ||||
|                OpEntryPoint Vertex %vs_main "vs_main" %position_1 %color_1 %quad_pos_1 %position_2 %color_2 %quad_pos_2 %vertex_point_size | ||||
|                OpEntryPoint Fragment %fs_main "fs_main" %position_3 %color_3 %quad_pos_3 %value_1 | ||||
|                OpEntryPoint GLCompute %simulate "simulate" %GlobalInvocationID_1 | ||||
|                OpEntryPoint GLCompute %import_level "import_level" %coord_1 | ||||
|                OpEntryPoint GLCompute %export_level "export_level" %coord_2 | ||||
|                OpExecutionMode %fs_main OriginUpperLeft | ||||
|                OpExecutionMode %simulate LocalSize 64 1 1 | ||||
|                OpExecutionMode %import_level LocalSize 64 1 1 | ||||
|                OpExecutionMode %export_level LocalSize 64 1 1 | ||||
|                OpName %position_1 "position_1" | ||||
|                OpName %color_1 "color_1" | ||||
|                OpName %quad_pos_1 "quad_pos_1" | ||||
|                OpName %position_2 "position_2" | ||||
|                OpName %color_2 "color_2" | ||||
|                OpName %quad_pos_2 "quad_pos_2" | ||||
|                OpName %vertex_point_size "vertex_point_size" | ||||
|                OpName %position_3 "position_3" | ||||
|                OpName %color_3 "color_3" | ||||
|                OpName %quad_pos_3 "quad_pos_3" | ||||
|                OpName %value_1 "value_1" | ||||
|                OpName %GlobalInvocationID_1 "GlobalInvocationID_1" | ||||
|                OpName %coord_1 "coord_1" | ||||
|                OpName %coord_2 "coord_2" | ||||
|                OpName %rand_seed "rand_seed" | ||||
|                OpName %RenderParams "RenderParams" | ||||
|                OpMemberName %RenderParams 0 "modelViewProjectionMatrix" | ||||
|                OpMemberName %RenderParams 1 "right" | ||||
|                OpMemberName %RenderParams 2 "up" | ||||
|                OpName %render_params "render_params" | ||||
|                OpName %SimulationParams "SimulationParams" | ||||
|                OpMemberName %SimulationParams 0 "deltaTime" | ||||
|                OpMemberName %SimulationParams 1 "seed" | ||||
|                OpName %sim_params "sim_params" | ||||
|                OpName %Particles "Particles" | ||||
|                OpMemberName %Particles 0 "particles" | ||||
|                OpName %Particle "Particle" | ||||
|                OpMemberName %Particle 0 "position" | ||||
|                OpMemberName %Particle 1 "lifetime" | ||||
|                OpMemberName %Particle 2 "color" | ||||
|                OpMemberName %Particle 3 "velocity" | ||||
|                OpName %data "data" | ||||
|                OpName %texture "texture" | ||||
|                OpName %UBO "UBO" | ||||
|                OpMemberName %UBO 0 "width" | ||||
|                OpName %ubo "ubo" | ||||
|                OpName %Buffer "Buffer" | ||||
|                OpMemberName %Buffer 0 "weights" | ||||
|                OpName %buf_in "buf_in" | ||||
|                OpName %buf_out "buf_out" | ||||
|                OpName %tex_in "tex_in" | ||||
|                OpName %tex_out "tex_out" | ||||
|                OpName %rand "rand" | ||||
|                OpName %VertexOutput "VertexOutput" | ||||
|                OpMemberName %VertexOutput 0 "position" | ||||
|                OpMemberName %VertexOutput 1 "color" | ||||
|                OpMemberName %VertexOutput 2 "quad_pos" | ||||
|                OpName %VertexInput "VertexInput" | ||||
|                OpMemberName %VertexInput 0 "position" | ||||
|                OpMemberName %VertexInput 1 "color" | ||||
|                OpMemberName %VertexInput 2 "quad_pos" | ||||
|                OpName %vs_main_inner "vs_main_inner" | ||||
|                OpName %in "in" | ||||
|                OpName %quad_pos "quad_pos" | ||||
|                OpName %position "position" | ||||
|                OpName %out "out" | ||||
|                OpName %vs_main "vs_main" | ||||
|                OpName %fs_main_inner "fs_main_inner" | ||||
|                OpName %in_0 "in" | ||||
|                OpName %color "color" | ||||
|                OpName %fs_main "fs_main" | ||||
|                OpName %simulate_inner "simulate_inner" | ||||
|                OpName %GlobalInvocationID "GlobalInvocationID" | ||||
|                OpName %particle "particle" | ||||
|                OpName %coord "coord" | ||||
|                OpName %level "level" | ||||
|                OpName %simulate "simulate" | ||||
|                OpName %import_level_inner "import_level_inner" | ||||
|                OpName %coord_0 "coord" | ||||
|                OpName %import_level "import_level" | ||||
|                OpName %export_level_inner "export_level_inner" | ||||
|                OpName %coord_3 "coord" | ||||
|                OpName %export_level "export_level" | ||||
|                OpDecorate %position_1 Location 0 | ||||
|                OpDecorate %color_1 Location 1 | ||||
|                OpDecorate %quad_pos_1 Location 2 | ||||
|                OpDecorate %position_2 BuiltIn Position | ||||
|                OpDecorate %color_2 Location 0 | ||||
|                OpDecorate %quad_pos_2 Location 1 | ||||
|                OpDecorate %vertex_point_size BuiltIn PointSize | ||||
|                OpDecorate %position_3 BuiltIn FragCoord | ||||
|                OpDecorate %color_3 Location 0 | ||||
|                OpDecorate %quad_pos_3 Location 1 | ||||
|                OpDecorate %value_1 Location 0 | ||||
|                OpDecorate %GlobalInvocationID_1 BuiltIn GlobalInvocationId | ||||
|                OpDecorate %coord_1 BuiltIn GlobalInvocationId | ||||
|                OpDecorate %coord_2 BuiltIn GlobalInvocationId | ||||
|                OpDecorate %RenderParams Block | ||||
|                OpMemberDecorate %RenderParams 0 Offset 0 | ||||
|                OpMemberDecorate %RenderParams 0 ColMajor | ||||
|                OpMemberDecorate %RenderParams 0 MatrixStride 16 | ||||
|                OpMemberDecorate %RenderParams 1 Offset 64 | ||||
|                OpMemberDecorate %RenderParams 2 Offset 80 | ||||
|                OpDecorate %render_params NonWritable | ||||
|                OpDecorate %render_params Binding 0 | ||||
|                OpDecorate %render_params DescriptorSet 0 | ||||
|                OpDecorate %SimulationParams Block | ||||
|                OpMemberDecorate %SimulationParams 0 Offset 0 | ||||
|                OpMemberDecorate %SimulationParams 1 Offset 16 | ||||
|                OpDecorate %sim_params NonWritable | ||||
|                OpDecorate %sim_params Binding 0 | ||||
|                OpDecorate %sim_params DescriptorSet 0 | ||||
|                OpDecorate %Particles Block | ||||
|                OpMemberDecorate %Particles 0 Offset 0 | ||||
|                OpMemberDecorate %Particle 0 Offset 0 | ||||
|                OpMemberDecorate %Particle 1 Offset 12 | ||||
|                OpMemberDecorate %Particle 2 Offset 16 | ||||
|                OpMemberDecorate %Particle 3 Offset 32 | ||||
|                OpDecorate %_runtimearr_Particle ArrayStride 48 | ||||
|                OpDecorate %data Binding 1 | ||||
|                OpDecorate %data DescriptorSet 0 | ||||
|                OpDecorate %texture Binding 2 | ||||
|                OpDecorate %texture DescriptorSet 0 | ||||
|                OpDecorate %UBO Block | ||||
|                OpMemberDecorate %UBO 0 Offset 0 | ||||
|                OpDecorate %ubo NonWritable | ||||
|                OpDecorate %ubo Binding 3 | ||||
|                OpDecorate %ubo DescriptorSet 0 | ||||
|                OpDecorate %Buffer Block | ||||
|                OpMemberDecorate %Buffer 0 Offset 0 | ||||
|                OpDecorate %_runtimearr_float ArrayStride 4 | ||||
|                OpDecorate %buf_in NonWritable | ||||
|                OpDecorate %buf_in Binding 4 | ||||
|                OpDecorate %buf_in DescriptorSet 0 | ||||
|                OpDecorate %buf_out Binding 5 | ||||
|                OpDecorate %buf_out DescriptorSet 0 | ||||
|                OpDecorate %tex_in Binding 6 | ||||
|                OpDecorate %tex_in DescriptorSet 0 | ||||
|                OpDecorate %tex_out NonReadable | ||||
|                OpDecorate %tex_out Binding 7 | ||||
|                OpDecorate %tex_out DescriptorSet 0 | ||||
|                OpMemberDecorate %VertexOutput 0 Offset 0 | ||||
|                OpMemberDecorate %VertexOutput 1 Offset 16 | ||||
|                OpMemberDecorate %VertexOutput 2 Offset 32 | ||||
|                OpMemberDecorate %VertexInput 0 Offset 0 | ||||
|                OpMemberDecorate %VertexInput 1 Offset 16 | ||||
|                OpMemberDecorate %VertexInput 2 Offset 32 | ||||
|       %float = OpTypeFloat 32 | ||||
|     %v3float = OpTypeVector %float 3 | ||||
| %_ptr_Input_v3float = OpTypePointer Input %v3float | ||||
|  %position_1 = OpVariable %_ptr_Input_v3float Input | ||||
|     %v4float = OpTypeVector %float 4 | ||||
| %_ptr_Input_v4float = OpTypePointer Input %v4float | ||||
|     %color_1 = OpVariable %_ptr_Input_v4float Input | ||||
|     %v2float = OpTypeVector %float 2 | ||||
| %_ptr_Input_v2float = OpTypePointer Input %v2float | ||||
|  %quad_pos_1 = OpVariable %_ptr_Input_v2float Input | ||||
| %_ptr_Output_v4float = OpTypePointer Output %v4float | ||||
|          %13 = OpConstantNull %v4float | ||||
|  %position_2 = OpVariable %_ptr_Output_v4float Output %13 | ||||
|     %color_2 = OpVariable %_ptr_Output_v4float Output %13 | ||||
| %_ptr_Output_v2float = OpTypePointer Output %v2float | ||||
|          %17 = OpConstantNull %v2float | ||||
|  %quad_pos_2 = OpVariable %_ptr_Output_v2float Output %17 | ||||
| %_ptr_Output_float = OpTypePointer Output %float | ||||
|          %20 = OpConstantNull %float | ||||
| %vertex_point_size = OpVariable %_ptr_Output_float Output %20 | ||||
|  %position_3 = OpVariable %_ptr_Input_v4float Input | ||||
|     %color_3 = OpVariable %_ptr_Input_v4float Input | ||||
|  %quad_pos_3 = OpVariable %_ptr_Input_v2float Input | ||||
|     %value_1 = OpVariable %_ptr_Output_v4float Output %13 | ||||
|        %uint = OpTypeInt 32 0 | ||||
|      %v3uint = OpTypeVector %uint 3 | ||||
| %_ptr_Input_v3uint = OpTypePointer Input %v3uint | ||||
| %GlobalInvocationID_1 = OpVariable %_ptr_Input_v3uint Input | ||||
|     %coord_1 = OpVariable %_ptr_Input_v3uint Input | ||||
|     %coord_2 = OpVariable %_ptr_Input_v3uint Input | ||||
| %_ptr_Private_v2float = OpTypePointer Private %v2float | ||||
|   %rand_seed = OpVariable %_ptr_Private_v2float Private %17 | ||||
| %mat4v4float = OpTypeMatrix %v4float 4 | ||||
| %RenderParams = OpTypeStruct %mat4v4float %v3float %v3float | ||||
| %_ptr_Uniform_RenderParams = OpTypePointer Uniform %RenderParams | ||||
| %render_params = OpVariable %_ptr_Uniform_RenderParams Uniform | ||||
| %SimulationParams = OpTypeStruct %float %v4float | ||||
| %_ptr_Uniform_SimulationParams = OpTypePointer Uniform %SimulationParams | ||||
|  %sim_params = OpVariable %_ptr_Uniform_SimulationParams Uniform | ||||
|    %Particle = OpTypeStruct %v3float %float %v4float %v3float | ||||
| %_runtimearr_Particle = OpTypeRuntimeArray %Particle | ||||
|   %Particles = OpTypeStruct %_runtimearr_Particle | ||||
| %_ptr_StorageBuffer_Particles = OpTypePointer StorageBuffer %Particles | ||||
|        %data = OpVariable %_ptr_StorageBuffer_Particles StorageBuffer | ||||
|          %47 = OpTypeImage %float 2D 0 0 0 1 Unknown | ||||
| %_ptr_UniformConstant_47 = OpTypePointer UniformConstant %47 | ||||
|     %texture = OpVariable %_ptr_UniformConstant_47 UniformConstant | ||||
|         %UBO = OpTypeStruct %uint | ||||
| %_ptr_Uniform_UBO = OpTypePointer Uniform %UBO | ||||
|         %ubo = OpVariable %_ptr_Uniform_UBO Uniform | ||||
| %_runtimearr_float = OpTypeRuntimeArray %float | ||||
|      %Buffer = OpTypeStruct %_runtimearr_float | ||||
| %_ptr_StorageBuffer_Buffer = OpTypePointer StorageBuffer %Buffer | ||||
|      %buf_in = OpVariable %_ptr_StorageBuffer_Buffer StorageBuffer | ||||
|     %buf_out = OpVariable %_ptr_StorageBuffer_Buffer StorageBuffer | ||||
|      %tex_in = OpVariable %_ptr_UniformConstant_47 UniformConstant | ||||
|          %59 = OpTypeImage %float 2D 0 0 0 2 Rgba8 | ||||
| %_ptr_UniformConstant_59 = OpTypePointer UniformConstant %59 | ||||
|     %tex_out = OpVariable %_ptr_UniformConstant_59 UniformConstant | ||||
|          %60 = OpTypeFunction %float | ||||
|      %uint_0 = OpConstant %uint 0 | ||||
| %_ptr_Private_float = OpTypePointer Private %float | ||||
| %float_23_1407795 = OpConstant %float 23.1407795 | ||||
| %float_232_616898 = OpConstant %float 232.616898 | ||||
|          %73 = OpConstantComposite %v2float %float_23_1407795 %float_232_616898 | ||||
| %float_136_816803 = OpConstant %float 136.816803 | ||||
|      %uint_1 = OpConstant %uint 1 | ||||
| %float_54_4785652 = OpConstant %float 54.4785652 | ||||
| %float_345_841522 = OpConstant %float 345.841522 | ||||
|          %84 = OpConstantComposite %v2float %float_54_4785652 %float_345_841522 | ||||
| %float_534_764526 = OpConstant %float 534.764526 | ||||
| %VertexOutput = OpTypeStruct %v4float %v4float %v2float | ||||
| %VertexInput = OpTypeStruct %v3float %v4float %v2float | ||||
|          %89 = OpTypeFunction %VertexOutput %VertexInput | ||||
| %mat2v3float = OpTypeMatrix %v3float 2 | ||||
| %_ptr_Uniform_v3float = OpTypePointer Uniform %v3float | ||||
|      %uint_2 = OpConstant %uint 2 | ||||
| %_ptr_Function_v3float = OpTypePointer Function %v3float | ||||
|         %107 = OpConstantNull %v3float | ||||
| %float_0_00999999978 = OpConstant %float 0.00999999978 | ||||
| %_ptr_Function_VertexOutput = OpTypePointer Function %VertexOutput | ||||
|         %116 = OpConstantNull %VertexOutput | ||||
| %_ptr_Function_v4float = OpTypePointer Function %v4float | ||||
| %_ptr_Uniform_mat4v4float = OpTypePointer Uniform %mat4v4float | ||||
|     %float_1 = OpConstant %float 1 | ||||
| %_ptr_Function_v2float = OpTypePointer Function %v2float | ||||
|        %void = OpTypeVoid | ||||
|         %135 = OpTypeFunction %void | ||||
|         %147 = OpTypeFunction %v4float %VertexOutput | ||||
|      %uint_3 = OpConstant %uint 3 | ||||
| %_ptr_Function_float = OpTypePointer Function %float | ||||
|     %float_0 = OpConstant %float 0 | ||||
|         %172 = OpTypeFunction %void %v3uint | ||||
| %_ptr_Uniform_v4float = OpTypePointer Uniform %v4float | ||||
|      %v2uint = OpTypeVector %uint 2 | ||||
| %_ptr_StorageBuffer_Particle = OpTypePointer StorageBuffer %Particle | ||||
| %_ptr_Function_Particle = OpTypePointer Function %Particle | ||||
|         %194 = OpConstantNull %Particle | ||||
| %_ptr_Uniform_float = OpTypePointer Uniform %float | ||||
|   %float_0_5 = OpConstant %float 0.5 | ||||
|        %bool = OpTypeBool | ||||
|         %int = OpTypeInt 32 1 | ||||
|       %v2int = OpTypeVector %int 2 | ||||
|       %int_0 = OpConstant %int 0 | ||||
|         %232 = OpConstantComposite %v2int %int_0 %int_0 | ||||
| %_ptr_Function_v2int = OpTypePointer Function %v2int | ||||
|         %235 = OpConstantNull %v2int | ||||
|       %int_1 = OpConstant %int 1 | ||||
| %_ptr_Function_int = OpTypePointer Function %int | ||||
|         %242 = OpConstantNull %int | ||||
|      %v4bool = OpTypeVector %bool 4 | ||||
|       %int_2 = OpConstant %int 2 | ||||
|      %v2bool = OpTypeVector %bool 2 | ||||
|     %float_3 = OpConstant %float 3 | ||||
|    %float_n1 = OpConstant %float -1 | ||||
|         %302 = OpConstantComposite %v2float %float_1 %float_n1 | ||||
| %float_0_100000001 = OpConstant %float 0.100000001 | ||||
| %float_0_300000012 = OpConstant %float 0.300000012 | ||||
|     %float_2 = OpConstant %float 2 | ||||
| %_ptr_Uniform_uint = OpTypePointer Uniform %uint | ||||
| %_ptr_StorageBuffer_float = OpTypePointer StorageBuffer %float | ||||
|         %402 = OpConstantComposite %v4float %float_1 %float_1 %float_1 %float_1 | ||||
|     %float_4 = OpConstant %float 4 | ||||
| %float_9_99999975en05 = OpConstant %float 9.99999975e-05 | ||||
|        %rand = OpFunction %float None %60 | ||||
|          %62 = OpLabel | ||||
|          %65 = OpAccessChain %_ptr_Private_float %rand_seed %uint_0 | ||||
|          %70 = OpLoad %v2float %rand_seed | ||||
|          %69 = OpDot %float %70 %73 | ||||
|          %68 = OpExtInst %float %67 Cos %69 | ||||
|          %75 = OpFMul %float %68 %float_136_816803 | ||||
|          %66 = OpExtInst %float %67 Fract %75 | ||||
|                OpStore %65 %66 | ||||
|          %77 = OpAccessChain %_ptr_Private_float %rand_seed %uint_1 | ||||
|          %81 = OpLoad %v2float %rand_seed | ||||
|          %80 = OpDot %float %81 %84 | ||||
|          %79 = OpExtInst %float %67 Cos %80 | ||||
|          %86 = OpFMul %float %79 %float_534_764526 | ||||
|          %78 = OpExtInst %float %67 Fract %86 | ||||
|                OpStore %77 %78 | ||||
|          %87 = OpAccessChain %_ptr_Private_float %rand_seed %uint_1 | ||||
|          %88 = OpLoad %float %87 | ||||
|                OpReturnValue %88 | ||||
|                OpFunctionEnd | ||||
| %vs_main_inner = OpFunction %VertexOutput None %89 | ||||
|          %in = OpFunctionParameter %VertexInput | ||||
|          %94 = OpLabel | ||||
|    %quad_pos = OpVariable %_ptr_Function_v3float Function %107 | ||||
|    %position = OpVariable %_ptr_Function_v3float Function %107 | ||||
|         %out = OpVariable %_ptr_Function_VertexOutput Function %116 | ||||
|          %97 = OpAccessChain %_ptr_Uniform_v3float %render_params %uint_1 | ||||
|          %98 = OpLoad %v3float %97 | ||||
|         %100 = OpAccessChain %_ptr_Uniform_v3float %render_params %uint_2 | ||||
|         %101 = OpLoad %v3float %100 | ||||
|         %102 = OpCompositeConstruct %mat2v3float %98 %101 | ||||
|         %103 = OpCompositeExtract %v2float %in 2 | ||||
|         %104 = OpMatrixTimesVector %v3float %102 %103 | ||||
|                OpStore %quad_pos %104 | ||||
|         %108 = OpCompositeExtract %v3float %in 0 | ||||
|         %109 = OpLoad %v3float %quad_pos | ||||
|         %111 = OpVectorTimesScalar %v3float %109 %float_0_00999999978 | ||||
|         %112 = OpFAdd %v3float %108 %111 | ||||
|                OpStore %position %112 | ||||
|         %118 = OpAccessChain %_ptr_Function_v4float %out %uint_0 | ||||
|         %120 = OpAccessChain %_ptr_Uniform_mat4v4float %render_params %uint_0 | ||||
|         %121 = OpLoad %mat4v4float %120 | ||||
|         %122 = OpLoad %v3float %position | ||||
|         %123 = OpCompositeExtract %float %122 0 | ||||
|         %124 = OpCompositeExtract %float %122 1 | ||||
|         %125 = OpCompositeExtract %float %122 2 | ||||
|         %127 = OpCompositeConstruct %v4float %123 %124 %125 %float_1 | ||||
|         %128 = OpMatrixTimesVector %v4float %121 %127 | ||||
|                OpStore %118 %128 | ||||
|         %129 = OpAccessChain %_ptr_Function_v4float %out %uint_1 | ||||
|         %130 = OpCompositeExtract %v4float %in 1 | ||||
|                OpStore %129 %130 | ||||
|         %132 = OpAccessChain %_ptr_Function_v2float %out %uint_2 | ||||
|         %133 = OpCompositeExtract %v2float %in 2 | ||||
|                OpStore %132 %133 | ||||
|         %134 = OpLoad %VertexOutput %out | ||||
|                OpReturnValue %134 | ||||
|                OpFunctionEnd | ||||
|     %vs_main = OpFunction %void None %135 | ||||
|         %138 = OpLabel | ||||
|         %140 = OpLoad %v3float %position_1 | ||||
|         %141 = OpLoad %v4float %color_1 | ||||
|         %142 = OpLoad %v2float %quad_pos_1 | ||||
|         %143 = OpCompositeConstruct %VertexInput %140 %141 %142 | ||||
|         %139 = OpFunctionCall %VertexOutput %vs_main_inner %143 | ||||
|         %144 = OpCompositeExtract %v4float %139 0 | ||||
|                OpStore %position_2 %144 | ||||
|         %145 = OpCompositeExtract %v4float %139 1 | ||||
|                OpStore %color_2 %145 | ||||
|         %146 = OpCompositeExtract %v2float %139 2 | ||||
|                OpStore %quad_pos_2 %146 | ||||
|                OpStore %vertex_point_size %float_1 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %fs_main_inner = OpFunction %v4float None %147 | ||||
|        %in_0 = OpFunctionParameter %VertexOutput | ||||
|         %150 = OpLabel | ||||
|       %color = OpVariable %_ptr_Function_v4float Function %13 | ||||
|         %151 = OpCompositeExtract %v4float %in_0 1 | ||||
|                OpStore %color %151 | ||||
|         %155 = OpAccessChain %_ptr_Function_float %color %uint_3 | ||||
|         %156 = OpAccessChain %_ptr_Function_float %color %uint_3 | ||||
|         %157 = OpLoad %float %156 | ||||
|         %160 = OpCompositeExtract %v2float %in_0 2 | ||||
|         %159 = OpExtInst %float %67 Length %160 | ||||
|         %161 = OpFSub %float %float_1 %159 | ||||
|         %158 = OpExtInst %float %67 NMax %161 %float_0 | ||||
|         %163 = OpFMul %float %157 %158 | ||||
|                OpStore %155 %163 | ||||
|         %164 = OpLoad %v4float %color | ||||
|                OpReturnValue %164 | ||||
|                OpFunctionEnd | ||||
|     %fs_main = OpFunction %void None %135 | ||||
|         %166 = OpLabel | ||||
|         %168 = OpLoad %v4float %position_3 | ||||
|         %169 = OpLoad %v4float %color_3 | ||||
|         %170 = OpLoad %v2float %quad_pos_3 | ||||
|         %171 = OpCompositeConstruct %VertexOutput %168 %169 %170 | ||||
|         %167 = OpFunctionCall %v4float %fs_main_inner %171 | ||||
|                OpStore %value_1 %167 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %simulate_inner = OpFunction %void None %172 | ||||
| %GlobalInvocationID = OpFunctionParameter %v3uint | ||||
|         %175 = OpLabel | ||||
|    %particle = OpVariable %_ptr_Function_Particle Function %194 | ||||
|       %coord = OpVariable %_ptr_Function_v2int Function %235 | ||||
|       %level = OpVariable %_ptr_Function_int Function %242 | ||||
|         %270 = OpVariable %_ptr_Function_v2int Function %235 | ||||
|         %297 = OpVariable %_ptr_Function_v2float Function %17 | ||||
|         %177 = OpAccessChain %_ptr_Uniform_v4float %sim_params %uint_1 | ||||
|         %178 = OpLoad %v4float %177 | ||||
|         %179 = OpVectorShuffle %v2float %178 %178 0 1 | ||||
|         %182 = OpVectorShuffle %v2uint %GlobalInvocationID %GlobalInvocationID 0 1 | ||||
|         %180 = OpConvertUToF %v2float %182 | ||||
|         %183 = OpFAdd %v2float %179 %180 | ||||
|         %184 = OpAccessChain %_ptr_Uniform_v4float %sim_params %uint_1 | ||||
|         %185 = OpLoad %v4float %184 | ||||
|         %186 = OpVectorShuffle %v2float %185 %185 2 3 | ||||
|         %187 = OpFMul %v2float %183 %186 | ||||
|                OpStore %rand_seed %187 | ||||
|         %188 = OpCompositeExtract %uint %GlobalInvocationID 0 | ||||
|         %190 = OpAccessChain %_ptr_StorageBuffer_Particle %data %uint_0 %188 | ||||
|         %191 = OpLoad %Particle %190 | ||||
|                OpStore %particle %191 | ||||
|         %195 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2 | ||||
|         %196 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2 | ||||
|         %197 = OpLoad %float %196 | ||||
|         %199 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0 | ||||
|         %200 = OpLoad %float %199 | ||||
|         %202 = OpFMul %float %200 %float_0_5 | ||||
|         %203 = OpFSub %float %197 %202 | ||||
|                OpStore %195 %203 | ||||
|         %204 = OpAccessChain %_ptr_Function_v3float %particle %uint_0 | ||||
|         %205 = OpAccessChain %_ptr_Function_v3float %particle %uint_0 | ||||
|         %206 = OpLoad %v3float %205 | ||||
|         %207 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0 | ||||
|         %208 = OpLoad %float %207 | ||||
|         %209 = OpAccessChain %_ptr_Function_v3float %particle %uint_3 | ||||
|         %210 = OpLoad %v3float %209 | ||||
|         %211 = OpVectorTimesScalar %v3float %210 %208 | ||||
|         %212 = OpFAdd %v3float %206 %211 | ||||
|                OpStore %204 %212 | ||||
|         %213 = OpAccessChain %_ptr_Function_float %particle %uint_1 | ||||
|         %214 = OpAccessChain %_ptr_Function_float %particle %uint_1 | ||||
|         %215 = OpLoad %float %214 | ||||
|         %216 = OpAccessChain %_ptr_Uniform_float %sim_params %uint_0 | ||||
|         %217 = OpLoad %float %216 | ||||
|         %218 = OpFSub %float %215 %217 | ||||
|                OpStore %213 %218 | ||||
|         %219 = OpAccessChain %_ptr_Function_float %particle %uint_2 %uint_3 | ||||
|         %221 = OpAccessChain %_ptr_Function_float %particle %uint_1 | ||||
|         %222 = OpLoad %float %221 | ||||
|         %220 = OpExtInst %float %67 SmoothStep %float_0 %float_0_5 %222 | ||||
|                OpStore %219 %220 | ||||
|         %223 = OpAccessChain %_ptr_Function_float %particle %uint_1 | ||||
|         %224 = OpLoad %float %223 | ||||
|         %225 = OpFOrdLessThan %bool %224 %float_0 | ||||
|                OpSelectionMerge %227 None | ||||
|                OpBranchConditional %225 %228 %227 | ||||
|         %228 = OpLabel | ||||
|                OpStore %coord %232 | ||||
|         %237 = OpLoad %47 %texture | ||||
|         %236 = OpImageQueryLevels %int %237 | ||||
|         %239 = OpISub %int %236 %int_1 | ||||
|                OpStore %level %239 | ||||
|                OpBranch %243 | ||||
|         %243 = OpLabel | ||||
|                OpLoopMerge %244 %245 None | ||||
|                OpBranch %246 | ||||
|         %246 = OpLabel | ||||
|         %248 = OpLoad %int %level | ||||
|         %249 = OpSGreaterThan %bool %248 %int_0 | ||||
|         %247 = OpLogicalNot %bool %249 | ||||
|                OpSelectionMerge %250 None | ||||
|                OpBranchConditional %247 %251 %250 | ||||
|         %251 = OpLabel | ||||
|                OpBranch %244 | ||||
|         %250 = OpLabel | ||||
|         %253 = OpLoad %47 %texture | ||||
|         %254 = OpLoad %v2int %coord | ||||
|         %255 = OpLoad %int %level | ||||
|         %252 = OpImageFetch %v4float %253 %254 Lod %255 | ||||
|         %256 = OpFunctionCall %float %rand | ||||
|         %257 = OpCompositeConstruct %v4float %256 %256 %256 %256 | ||||
|         %258 = OpVectorShuffle %v3float %252 %252 0 1 2 | ||||
|         %259 = OpCompositeExtract %float %258 0 | ||||
|         %260 = OpCompositeExtract %float %258 1 | ||||
|         %261 = OpCompositeExtract %float %258 2 | ||||
|         %262 = OpCompositeConstruct %v4float %float_0 %259 %260 %261 | ||||
|         %263 = OpFOrdGreaterThanEqual %v4bool %257 %262 | ||||
|         %265 = OpFOrdLessThan %v4bool %257 %252 | ||||
|         %266 = OpLogicalAnd %v4bool %263 %265 | ||||
|         %267 = OpLoad %v2int %coord | ||||
|         %271 = OpCompositeConstruct %v2int %int_2 %int_2 | ||||
|         %269 = OpIMul %v2int %267 %271 | ||||
|                OpStore %coord %269 | ||||
|         %272 = OpAccessChain %_ptr_Function_int %coord %uint_0 | ||||
|         %273 = OpAccessChain %_ptr_Function_int %coord %uint_0 | ||||
|         %274 = OpLoad %int %273 | ||||
|         %278 = OpVectorShuffle %v2bool %266 %266 1 3 | ||||
|         %276 = OpAny %bool %278 | ||||
|         %275 = OpSelect %int %276 %int_1 %int_0 | ||||
|         %279 = OpIAdd %int %274 %275 | ||||
|                OpStore %272 %279 | ||||
|         %280 = OpAccessChain %_ptr_Function_int %coord %uint_1 | ||||
|         %281 = OpAccessChain %_ptr_Function_int %coord %uint_1 | ||||
|         %282 = OpLoad %int %281 | ||||
|         %285 = OpVectorShuffle %v2bool %266 %266 2 3 | ||||
|         %284 = OpAny %bool %285 | ||||
|         %283 = OpSelect %int %284 %int_1 %int_0 | ||||
|         %286 = OpIAdd %int %282 %283 | ||||
|                OpStore %280 %286 | ||||
|                OpBranch %245 | ||||
|         %245 = OpLabel | ||||
|         %287 = OpLoad %int %level | ||||
|         %288 = OpISub %int %287 %int_1 | ||||
|                OpStore %level %288 | ||||
|                OpBranch %243 | ||||
|         %244 = OpLabel | ||||
|         %290 = OpLoad %v2int %coord | ||||
|         %289 = OpConvertSToF %v2float %290 | ||||
|         %293 = OpLoad %47 %texture | ||||
|         %292 = OpImageQuerySizeLod %v2int %293 %int_0 | ||||
|         %291 = OpConvertSToF %v2float %292 | ||||
|         %294 = OpFDiv %v2float %289 %291 | ||||
|         %295 = OpAccessChain %_ptr_Function_v3float %particle %uint_0 | ||||
|         %298 = OpCompositeConstruct %v2float %float_0_5 %float_0_5 | ||||
|         %296 = OpFSub %v2float %294 %298 | ||||
|         %300 = OpVectorTimesScalar %v2float %296 %float_3 | ||||
|         %303 = OpFMul %v2float %300 %302 | ||||
|         %304 = OpCompositeExtract %float %303 0 | ||||
|         %305 = OpCompositeExtract %float %303 1 | ||||
|         %306 = OpCompositeConstruct %v3float %304 %305 %float_0 | ||||
|                OpStore %295 %306 | ||||
|         %307 = OpAccessChain %_ptr_Function_v4float %particle %uint_2 | ||||
|         %309 = OpLoad %47 %texture | ||||
|         %310 = OpLoad %v2int %coord | ||||
|         %308 = OpImageFetch %v4float %309 %310 Lod %int_0 | ||||
|                OpStore %307 %308 | ||||
|         %311 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_0 | ||||
|         %312 = OpFunctionCall %float %rand | ||||
|         %313 = OpFSub %float %312 %float_0_5 | ||||
|         %315 = OpFMul %float %313 %float_0_100000001 | ||||
|                OpStore %311 %315 | ||||
|         %316 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_1 | ||||
|         %317 = OpFunctionCall %float %rand | ||||
|         %318 = OpFSub %float %317 %float_0_5 | ||||
|         %319 = OpFMul %float %318 %float_0_100000001 | ||||
|                OpStore %316 %319 | ||||
|         %320 = OpAccessChain %_ptr_Function_float %particle %uint_3 %uint_2 | ||||
|         %321 = OpFunctionCall %float %rand | ||||
|         %323 = OpFMul %float %321 %float_0_300000012 | ||||
|                OpStore %320 %323 | ||||
|         %324 = OpAccessChain %_ptr_Function_float %particle %uint_1 | ||||
|         %325 = OpFunctionCall %float %rand | ||||
|         %327 = OpFMul %float %325 %float_2 | ||||
|         %328 = OpFAdd %float %float_0_5 %327 | ||||
|                OpStore %324 %328 | ||||
|                OpBranch %227 | ||||
|         %227 = OpLabel | ||||
|         %329 = OpAccessChain %_ptr_StorageBuffer_Particle %data %uint_0 %188 | ||||
|         %330 = OpLoad %Particle %particle | ||||
|                OpStore %329 %330 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
|    %simulate = OpFunction %void None %135 | ||||
|         %332 = OpLabel | ||||
|         %334 = OpLoad %v3uint %GlobalInvocationID_1 | ||||
|         %333 = OpFunctionCall %void %simulate_inner %334 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %import_level_inner = OpFunction %void None %172 | ||||
|     %coord_0 = OpFunctionParameter %v3uint | ||||
|         %337 = OpLabel | ||||
|         %339 = OpCompositeExtract %uint %coord_0 0 | ||||
|         %340 = OpCompositeExtract %uint %coord_0 1 | ||||
|         %342 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0 | ||||
|         %343 = OpLoad %uint %342 | ||||
|         %344 = OpIMul %uint %340 %343 | ||||
|         %345 = OpIAdd %uint %339 %344 | ||||
|         %347 = OpAccessChain %_ptr_StorageBuffer_float %buf_out %uint_0 %345 | ||||
|         %349 = OpLoad %47 %tex_in | ||||
|         %351 = OpVectorShuffle %v2uint %coord_0 %coord_0 0 1 | ||||
|         %350 = OpBitcast %v2int %351 | ||||
|         %348 = OpImageFetch %v4float %349 %350 Lod %int_0 | ||||
|         %352 = OpCompositeExtract %float %348 3 | ||||
|                OpStore %347 %352 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %import_level = OpFunction %void None %135 | ||||
|         %354 = OpLabel | ||||
|         %356 = OpLoad %v3uint %coord_1 | ||||
|         %355 = OpFunctionCall %void %import_level_inner %356 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %export_level_inner = OpFunction %void None %172 | ||||
|     %coord_3 = OpFunctionParameter %v3uint | ||||
|         %359 = OpLabel | ||||
|         %413 = OpVariable %_ptr_Function_v4float Function %13 | ||||
|         %361 = OpVectorShuffle %v2uint %coord_3 %coord_3 0 1 | ||||
|         %364 = OpLoad %59 %tex_out | ||||
|         %363 = OpImageQuerySize %v2int %364 | ||||
|         %362 = OpBitcast %v2uint %363 | ||||
|         %365 = OpULessThan %v2bool %361 %362 | ||||
|         %360 = OpAll %bool %365 | ||||
|                OpSelectionMerge %366 None | ||||
|                OpBranchConditional %360 %367 %366 | ||||
|         %367 = OpLabel | ||||
|         %368 = OpCompositeExtract %uint %coord_3 0 | ||||
|         %369 = OpCompositeExtract %uint %coord_3 1 | ||||
|         %370 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0 | ||||
|         %371 = OpLoad %uint %370 | ||||
|         %372 = OpIMul %uint %369 %371 | ||||
|         %373 = OpIAdd %uint %368 %372 | ||||
|         %374 = OpCompositeExtract %uint %coord_3 0 | ||||
|         %375 = OpIMul %uint %374 %uint_2 | ||||
|         %376 = OpCompositeExtract %uint %coord_3 1 | ||||
|         %377 = OpIMul %uint %376 %uint_2 | ||||
|         %378 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0 | ||||
|         %379 = OpLoad %uint %378 | ||||
|         %380 = OpIMul %uint %377 %379 | ||||
|         %381 = OpIAdd %uint %375 %380 | ||||
|         %382 = OpIAdd %uint %381 %uint_0 | ||||
|         %383 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %382 | ||||
|         %384 = OpLoad %float %383 | ||||
|         %385 = OpIAdd %uint %381 %uint_1 | ||||
|         %386 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %385 | ||||
|         %387 = OpLoad %float %386 | ||||
|         %388 = OpIAdd %uint %381 %uint_0 | ||||
|         %389 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0 | ||||
|         %390 = OpLoad %uint %389 | ||||
|         %391 = OpIAdd %uint %388 %390 | ||||
|         %392 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %391 | ||||
|         %393 = OpLoad %float %392 | ||||
|         %394 = OpIAdd %uint %381 %uint_1 | ||||
|         %395 = OpAccessChain %_ptr_Uniform_uint %ubo %uint_0 | ||||
|         %396 = OpLoad %uint %395 | ||||
|         %397 = OpIAdd %uint %394 %396 | ||||
|         %398 = OpAccessChain %_ptr_StorageBuffer_float %buf_in %uint_0 %397 | ||||
|         %399 = OpLoad %float %398 | ||||
|         %401 = OpCompositeConstruct %v4float %384 %387 %393 %399 | ||||
|         %400 = OpDot %float %401 %402 | ||||
|         %403 = OpAccessChain %_ptr_StorageBuffer_float %buf_out %uint_0 %373 | ||||
|         %405 = OpFDiv %float %400 %float_4 | ||||
|                OpStore %403 %405 | ||||
|         %406 = OpFAdd %float %384 %387 | ||||
|         %407 = OpFAdd %float %384 %387 | ||||
|         %408 = OpFAdd %float %407 %393 | ||||
|         %409 = OpCompositeConstruct %v4float %384 %406 %408 %400 | ||||
|         %410 = OpExtInst %float %67 NMax %400 %float_9_99999975en05 | ||||
|         %414 = OpCompositeConstruct %v4float %410 %410 %410 %410 | ||||
|         %412 = OpFDiv %v4float %409 %414 | ||||
|         %416 = OpLoad %59 %tex_out | ||||
|         %418 = OpVectorShuffle %v2uint %coord_3 %coord_3 0 1 | ||||
|         %417 = OpBitcast %v2int %418 | ||||
|                OpImageWrite %416 %417 %412 | ||||
|                OpBranch %366 | ||||
|         %366 = OpLabel | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
| %export_level = OpFunction %void None %135 | ||||
|         %420 = OpLabel | ||||
|         %422 = OpLoad %v3uint %coord_2 | ||||
|         %421 = OpFunctionCall %void %export_level_inner %422 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
							
								
								
									
										144
									
								
								test/benchmark/particles.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										144
									
								
								test/benchmark/particles.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,144 @@ | ||||
| var<private> rand_seed : vec2<f32>; | ||||
| 
 | ||||
| fn rand() -> f32 { | ||||
|   rand_seed.x = fract((cos(dot(rand_seed, vec2<f32>(23.140779495, 232.616897583))) * 136.816802979)); | ||||
|   rand_seed.y = fract((cos(dot(rand_seed, vec2<f32>(54.478565216, 345.841522217))) * 534.764526367)); | ||||
|   return rand_seed.y; | ||||
| } | ||||
| 
 | ||||
| struct RenderParams { | ||||
|   modelViewProjectionMatrix : mat4x4<f32>; | ||||
|   right : vec3<f32>; | ||||
|   up : vec3<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[binding(0), group(0)]] var<uniform> render_params : RenderParams; | ||||
| 
 | ||||
| struct VertexInput { | ||||
|   [[location(0)]] | ||||
|   position : vec3<f32>; | ||||
|   [[location(1)]] | ||||
|   color : vec4<f32>; | ||||
|   [[location(2)]] | ||||
|   quad_pos : vec2<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct VertexOutput { | ||||
|   [[builtin(position)]] | ||||
|   position : vec4<f32>; | ||||
|   [[location(0)]] | ||||
|   color : vec4<f32>; | ||||
|   [[location(1)]] | ||||
|   quad_pos : vec2<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[stage(vertex)]] | ||||
| fn vs_main(in : VertexInput) -> VertexOutput { | ||||
|   var quad_pos = (mat2x3<f32>(render_params.right, render_params.up) * in.quad_pos); | ||||
|   var position = (in.position + (quad_pos * 0.01)); | ||||
|   var out : VertexOutput; | ||||
|   out.position = (render_params.modelViewProjectionMatrix * vec4<f32>(position, 1.0)); | ||||
|   out.color = in.color; | ||||
|   out.quad_pos = in.quad_pos; | ||||
|   return out; | ||||
| } | ||||
| 
 | ||||
| [[stage(fragment)]] | ||||
| fn fs_main(in : VertexOutput) -> [[location(0)]] vec4<f32> { | ||||
|   var color = in.color; | ||||
|   color.a = (color.a * max((1.0 - length(in.quad_pos)), 0.0)); | ||||
|   return color; | ||||
| } | ||||
| 
 | ||||
| struct SimulationParams { | ||||
|   deltaTime : f32; | ||||
|   seed : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Particle { | ||||
|   position : vec3<f32>; | ||||
|   lifetime : f32; | ||||
|   color : vec4<f32>; | ||||
|   velocity : vec3<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Particles { | ||||
|   particles : array<Particle>; | ||||
| }; | ||||
| 
 | ||||
| [[binding(0), group(0)]] var<uniform> sim_params : SimulationParams; | ||||
| 
 | ||||
| [[binding(1), group(0)]] var<storage, read_write> data : Particles; | ||||
| 
 | ||||
| [[binding(2), group(0)]] var texture : texture_2d<f32>; | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn simulate([[builtin(global_invocation_id)]] GlobalInvocationID : vec3<u32>) { | ||||
|   rand_seed = ((sim_params.seed.xy + vec2<f32>(GlobalInvocationID.xy)) * sim_params.seed.zw); | ||||
|   let idx = GlobalInvocationID.x; | ||||
|   var particle = data.particles[idx]; | ||||
|   particle.velocity.z = (particle.velocity.z - (sim_params.deltaTime * 0.5)); | ||||
|   particle.position = (particle.position + (sim_params.deltaTime * particle.velocity)); | ||||
|   particle.lifetime = (particle.lifetime - sim_params.deltaTime); | ||||
|   particle.color.a = smoothStep(0.0, 0.5, particle.lifetime); | ||||
|   if ((particle.lifetime < 0.0)) { | ||||
|     var coord = vec2<i32>(0, 0); | ||||
|     for(var level = (textureNumLevels(texture) - 1); (level > 0); level = (level - 1)) { | ||||
|       let probabilites = textureLoad(texture, coord, level); | ||||
|       let value = vec4<f32>(rand()); | ||||
|       let mask = ((value >= vec4<f32>(0.0, probabilites.xyz)) & (value < probabilites)); | ||||
|       coord = (coord * 2); | ||||
|       coord.x = (coord.x + select(0, 1, any(mask.yw))); | ||||
|       coord.y = (coord.y + select(0, 1, any(mask.zw))); | ||||
|     } | ||||
|     let uv = (vec2<f32>(coord) / vec2<f32>(textureDimensions(texture))); | ||||
|     particle.position = vec3<f32>((((uv - 0.5) * 3.0) * vec2<f32>(1.0, -1.0)), 0.0); | ||||
|     particle.color = textureLoad(texture, coord, 0); | ||||
|     particle.velocity.x = ((rand() - 0.5) * 0.100000001); | ||||
|     particle.velocity.y = ((rand() - 0.5) * 0.100000001); | ||||
|     particle.velocity.z = (rand() * 0.300000012); | ||||
|     particle.lifetime = (0.5 + (rand() * 2.0)); | ||||
|   } | ||||
|   data.particles[idx] = particle; | ||||
| } | ||||
| 
 | ||||
| struct UBO { | ||||
|   width : u32; | ||||
| }; | ||||
| 
 | ||||
| struct Buffer { | ||||
|   weights : array<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[binding(3), group(0)]] var<uniform> ubo : UBO; | ||||
| 
 | ||||
| [[binding(4), group(0)]] var<storage, read> buf_in : Buffer; | ||||
| 
 | ||||
| [[binding(5), group(0)]] var<storage, read_write> buf_out : Buffer; | ||||
| 
 | ||||
| [[binding(6), group(0)]] var tex_in : texture_2d<f32>; | ||||
| 
 | ||||
| [[binding(7), group(0)]] var tex_out : texture_storage_2d<rgba8unorm, write>; | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn import_level([[builtin(global_invocation_id)]] coord : vec3<u32>) { | ||||
|   _ = &(buf_in); | ||||
|   let offset = (coord.x + (coord.y * ubo.width)); | ||||
|   buf_out.weights[offset] = textureLoad(tex_in, vec2<i32>(coord.xy), 0).w; | ||||
| } | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(64)]] | ||||
| fn export_level([[builtin(global_invocation_id)]] coord : vec3<u32>) { | ||||
|   if (all((coord.xy < vec2<u32>(textureDimensions(tex_out))))) { | ||||
|     let dst_offset = (coord.x + (coord.y * ubo.width)); | ||||
|     let src_offset = ((coord.x * 2u) + ((coord.y * 2u) * ubo.width)); | ||||
|     let a = buf_in.weights[(src_offset + 0u)]; | ||||
|     let b = buf_in.weights[(src_offset + 1u)]; | ||||
|     let c = buf_in.weights[((src_offset + 0u) + ubo.width)]; | ||||
|     let d = buf_in.weights[((src_offset + 1u) + ubo.width)]; | ||||
|     let sum = dot(vec4<f32>(a, b, c, d), vec4<f32>(1.0)); | ||||
|     buf_out.weights[dst_offset] = (sum / 4.0); | ||||
|     let probabilities = (vec4<f32>(a, (a + b), ((a + b) + c), sum) / max(sum, 0.0001)); | ||||
|     textureStore(tex_out, vec2<i32>(coord.xy), probabilities); | ||||
|   } | ||||
| } | ||||
							
								
								
									
										10
									
								
								test/benchmark/simple_compute.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										10
									
								
								test/benchmark/simple_compute.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,10 @@ | ||||
| struct SB { | ||||
|   data : array<i32>; | ||||
| }; | ||||
| 
 | ||||
| [[group(0), binding(0)]] var<storage, read_write> buffer : SB; | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(1, 2, 3)]] | ||||
| fn main([[builtin(global_invocation_id)]] id : vec3<u32>) { | ||||
|   buffer.data[id.x] = buffer.data[id.x] + 1; | ||||
| } | ||||
							
								
								
									
										15
									
								
								test/benchmark/simple_compute.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										15
									
								
								test/benchmark/simple_compute.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,15 @@ | ||||
| RWByteAddressBuffer buffer : register(u0, space0); | ||||
| 
 | ||||
| struct tint_symbol_1 { | ||||
|   uint3 id : SV_DispatchThreadID; | ||||
| }; | ||||
| 
 | ||||
| void main_inner(uint3 id) { | ||||
|   buffer.Store((4u * id.x), asuint((asint(buffer.Load((4u * id.x))) + 1))); | ||||
| } | ||||
| 
 | ||||
| [numthreads(1, 2, 3)] | ||||
| void main(tint_symbol_1 tint_symbol) { | ||||
|   main_inner(tint_symbol.id); | ||||
|   return; | ||||
| } | ||||
							
								
								
									
										16
									
								
								test/benchmark/simple_compute.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										16
									
								
								test/benchmark/simple_compute.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,16 @@ | ||||
| #include <metal_stdlib> | ||||
| 
 | ||||
| using namespace metal; | ||||
| struct SB { | ||||
|   /* 0x0000 */ int data[1]; | ||||
| }; | ||||
| 
 | ||||
| void tint_symbol_1_inner(uint3 id, device SB* const tint_symbol_2) { | ||||
|   (*(tint_symbol_2)).data[id[0]] = as_type<int>((as_type<uint>((*(tint_symbol_2)).data[id[0]]) + as_type<uint>(1))); | ||||
| } | ||||
| 
 | ||||
| kernel void tint_symbol_1(device SB* tint_symbol_3 [[buffer(0)]], uint3 id [[thread_position_in_grid]]) { | ||||
|   tint_symbol_1_inner(id, tint_symbol_3); | ||||
|   return; | ||||
| } | ||||
| 
 | ||||
							
								
								
									
										55
									
								
								test/benchmark/simple_compute.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										55
									
								
								test/benchmark/simple_compute.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,55 @@ | ||||
| ; SPIR-V | ||||
| ; Version: 1.3 | ||||
| ; Generator: Google Tint Compiler; 0 | ||||
| ; Bound: 29 | ||||
| ; Schema: 0 | ||||
|                OpCapability Shader | ||||
|                OpMemoryModel Logical GLSL450 | ||||
|                OpEntryPoint GLCompute %main "main" %id_1 | ||||
|                OpExecutionMode %main LocalSize 1 2 3 | ||||
|                OpName %id_1 "id_1" | ||||
|                OpName %SB "SB" | ||||
|                OpMemberName %SB 0 "data" | ||||
|                OpName %buffer "buffer" | ||||
|                OpName %main_inner "main_inner" | ||||
|                OpName %id "id" | ||||
|                OpName %main "main" | ||||
|                OpDecorate %id_1 BuiltIn GlobalInvocationId | ||||
|                OpDecorate %SB Block | ||||
|                OpMemberDecorate %SB 0 Offset 0 | ||||
|                OpDecorate %_runtimearr_int ArrayStride 4 | ||||
|                OpDecorate %buffer DescriptorSet 0 | ||||
|                OpDecorate %buffer Binding 0 | ||||
|        %uint = OpTypeInt 32 0 | ||||
|      %v3uint = OpTypeVector %uint 3 | ||||
| %_ptr_Input_v3uint = OpTypePointer Input %v3uint | ||||
|        %id_1 = OpVariable %_ptr_Input_v3uint Input | ||||
|         %int = OpTypeInt 32 1 | ||||
| %_runtimearr_int = OpTypeRuntimeArray %int | ||||
|          %SB = OpTypeStruct %_runtimearr_int | ||||
| %_ptr_StorageBuffer_SB = OpTypePointer StorageBuffer %SB | ||||
|      %buffer = OpVariable %_ptr_StorageBuffer_SB StorageBuffer | ||||
|        %void = OpTypeVoid | ||||
|          %10 = OpTypeFunction %void %v3uint | ||||
|      %uint_0 = OpConstant %uint 0 | ||||
| %_ptr_StorageBuffer_int = OpTypePointer StorageBuffer %int | ||||
|       %int_1 = OpConstant %int 1 | ||||
|          %24 = OpTypeFunction %void | ||||
|  %main_inner = OpFunction %void None %10 | ||||
|          %id = OpFunctionParameter %v3uint | ||||
|          %14 = OpLabel | ||||
|          %16 = OpCompositeExtract %uint %id 0 | ||||
|          %18 = OpAccessChain %_ptr_StorageBuffer_int %buffer %uint_0 %16 | ||||
|          %19 = OpCompositeExtract %uint %id 0 | ||||
|          %20 = OpAccessChain %_ptr_StorageBuffer_int %buffer %uint_0 %19 | ||||
|          %21 = OpLoad %int %20 | ||||
|          %23 = OpIAdd %int %21 %int_1 | ||||
|                OpStore %18 %23 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
|        %main = OpFunction %void None %24 | ||||
|          %26 = OpLabel | ||||
|          %28 = OpLoad %v3uint %id_1 | ||||
|          %27 = OpFunctionCall %void %main_inner %28 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
							
								
								
									
										10
									
								
								test/benchmark/simple_compute.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										10
									
								
								test/benchmark/simple_compute.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,10 @@ | ||||
| struct SB { | ||||
|   data : array<i32>; | ||||
| }; | ||||
| 
 | ||||
| [[group(0), binding(0)]] var<storage, read_write> buffer : SB; | ||||
| 
 | ||||
| [[stage(compute), workgroup_size(1, 2, 3)]] | ||||
| fn main([[builtin(global_invocation_id)]] id : vec3<u32>) { | ||||
|   buffer.data[id.x] = (buffer.data[id.x] + 1); | ||||
| } | ||||
							
								
								
									
										12
									
								
								test/benchmark/simple_fragment.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										12
									
								
								test/benchmark/simple_fragment.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,12 @@ | ||||
| struct Input { | ||||
|   [[location(0)]] color: vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Output { | ||||
|   [[location(0)]] color: vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[stage(fragment)]] | ||||
| fn main(in : Input) -> Output { | ||||
|   return Output(in.color); | ||||
| } | ||||
							
								
								
									
										25
									
								
								test/benchmark/simple_fragment.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										25
									
								
								test/benchmark/simple_fragment.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,25 @@ | ||||
| struct Input { | ||||
|   float4 color; | ||||
| }; | ||||
| struct Output { | ||||
|   float4 color; | ||||
| }; | ||||
| struct tint_symbol_2 { | ||||
|   float4 color : TEXCOORD0; | ||||
| }; | ||||
| struct tint_symbol_3 { | ||||
|   float4 color : SV_Target0; | ||||
| }; | ||||
| 
 | ||||
| Output main_inner(Input tint_symbol) { | ||||
|   const Output tint_symbol_4 = {tint_symbol.color}; | ||||
|   return tint_symbol_4; | ||||
| } | ||||
| 
 | ||||
| tint_symbol_3 main(tint_symbol_2 tint_symbol_1) { | ||||
|   const Input tint_symbol_5 = {tint_symbol_1.color}; | ||||
|   const Output inner_result = main_inner(tint_symbol_5); | ||||
|   tint_symbol_3 wrapper_result = (tint_symbol_3)0; | ||||
|   wrapper_result.color = inner_result.color; | ||||
|   return wrapper_result; | ||||
| } | ||||
							
								
								
									
										29
									
								
								test/benchmark/simple_fragment.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										29
									
								
								test/benchmark/simple_fragment.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,29 @@ | ||||
| #include <metal_stdlib> | ||||
| 
 | ||||
| using namespace metal; | ||||
| struct Input { | ||||
|   float4 color; | ||||
| }; | ||||
| struct Output { | ||||
|   float4 color; | ||||
| }; | ||||
| struct tint_symbol_2 { | ||||
|   float4 color [[user(locn0)]]; | ||||
| }; | ||||
| struct tint_symbol_3 { | ||||
|   float4 color [[color(0)]]; | ||||
| }; | ||||
| 
 | ||||
| Output tint_symbol_inner(Input in) { | ||||
|   Output const tint_symbol_4 = {.color=in.color}; | ||||
|   return tint_symbol_4; | ||||
| } | ||||
| 
 | ||||
| fragment tint_symbol_3 tint_symbol(tint_symbol_2 tint_symbol_1 [[stage_in]]) { | ||||
|   Input const tint_symbol_5 = {.color=tint_symbol_1.color}; | ||||
|   Output const inner_result = tint_symbol_inner(tint_symbol_5); | ||||
|   tint_symbol_3 wrapper_result = {}; | ||||
|   wrapper_result.color = inner_result.color; | ||||
|   return wrapper_result; | ||||
| } | ||||
| 
 | ||||
							
								
								
									
										50
									
								
								test/benchmark/simple_fragment.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										50
									
								
								test/benchmark/simple_fragment.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,50 @@ | ||||
| ; SPIR-V | ||||
| ; Version: 1.3 | ||||
| ; Generator: Google Tint Compiler; 0 | ||||
| ; Bound: 24 | ||||
| ; Schema: 0 | ||||
|                OpCapability Shader | ||||
|                OpMemoryModel Logical GLSL450 | ||||
|                OpEntryPoint Fragment %main "main" %color_1 %color_2 | ||||
|                OpExecutionMode %main OriginUpperLeft | ||||
|                OpName %color_1 "color_1" | ||||
|                OpName %color_2 "color_2" | ||||
|                OpName %Output "Output" | ||||
|                OpMemberName %Output 0 "color" | ||||
|                OpName %Input "Input" | ||||
|                OpMemberName %Input 0 "color" | ||||
|                OpName %main_inner "main_inner" | ||||
|                OpName %in "in" | ||||
|                OpName %main "main" | ||||
|                OpDecorate %color_1 Location 0 | ||||
|                OpDecorate %color_2 Location 0 | ||||
|                OpMemberDecorate %Output 0 Offset 0 | ||||
|                OpMemberDecorate %Input 0 Offset 0 | ||||
|       %float = OpTypeFloat 32 | ||||
|     %v4float = OpTypeVector %float 4 | ||||
| %_ptr_Input_v4float = OpTypePointer Input %v4float | ||||
|     %color_1 = OpVariable %_ptr_Input_v4float Input | ||||
| %_ptr_Output_v4float = OpTypePointer Output %v4float | ||||
|           %7 = OpConstantNull %v4float | ||||
|     %color_2 = OpVariable %_ptr_Output_v4float Output %7 | ||||
|      %Output = OpTypeStruct %v4float | ||||
|       %Input = OpTypeStruct %v4float | ||||
|           %8 = OpTypeFunction %Output %Input | ||||
|        %void = OpTypeVoid | ||||
|          %16 = OpTypeFunction %void | ||||
|  %main_inner = OpFunction %Output None %8 | ||||
|          %in = OpFunctionParameter %Input | ||||
|          %13 = OpLabel | ||||
|          %14 = OpCompositeExtract %v4float %in 0 | ||||
|          %15 = OpCompositeConstruct %Output %14 | ||||
|                OpReturnValue %15 | ||||
|                OpFunctionEnd | ||||
|        %main = OpFunction %void None %16 | ||||
|          %19 = OpLabel | ||||
|          %21 = OpLoad %v4float %color_1 | ||||
|          %22 = OpCompositeConstruct %Input %21 | ||||
|          %20 = OpFunctionCall %Output %main_inner %22 | ||||
|          %23 = OpCompositeExtract %v4float %20 0 | ||||
|                OpStore %color_2 %23 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
							
								
								
									
										14
									
								
								test/benchmark/simple_fragment.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										14
									
								
								test/benchmark/simple_fragment.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,14 @@ | ||||
| struct Input { | ||||
|   [[location(0)]] | ||||
|   color : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Output { | ||||
|   [[location(0)]] | ||||
|   color : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[stage(fragment)]] | ||||
| fn main(in : Input) -> Output { | ||||
|   return Output(in.color); | ||||
| } | ||||
							
								
								
									
										12
									
								
								test/benchmark/simple_vertex.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										12
									
								
								test/benchmark/simple_vertex.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,12 @@ | ||||
| struct Input { | ||||
|   [[location(0)]] position: vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Output { | ||||
|   [[builtin(position)]] position : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[stage(vertex)]] | ||||
| fn main(in : Input) -> Output { | ||||
|   return Output(in.position); | ||||
| } | ||||
							
								
								
									
										25
									
								
								test/benchmark/simple_vertex.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										25
									
								
								test/benchmark/simple_vertex.wgsl.expected.hlsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,25 @@ | ||||
| struct Input { | ||||
|   float4 position; | ||||
| }; | ||||
| struct Output { | ||||
|   float4 position; | ||||
| }; | ||||
| struct tint_symbol_2 { | ||||
|   float4 position : TEXCOORD0; | ||||
| }; | ||||
| struct tint_symbol_3 { | ||||
|   float4 position : SV_Position; | ||||
| }; | ||||
| 
 | ||||
| Output main_inner(Input tint_symbol) { | ||||
|   const Output tint_symbol_4 = {tint_symbol.position}; | ||||
|   return tint_symbol_4; | ||||
| } | ||||
| 
 | ||||
| tint_symbol_3 main(tint_symbol_2 tint_symbol_1) { | ||||
|   const Input tint_symbol_5 = {tint_symbol_1.position}; | ||||
|   const Output inner_result = main_inner(tint_symbol_5); | ||||
|   tint_symbol_3 wrapper_result = (tint_symbol_3)0; | ||||
|   wrapper_result.position = inner_result.position; | ||||
|   return wrapper_result; | ||||
| } | ||||
							
								
								
									
										29
									
								
								test/benchmark/simple_vertex.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										29
									
								
								test/benchmark/simple_vertex.wgsl.expected.msl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,29 @@ | ||||
| #include <metal_stdlib> | ||||
| 
 | ||||
| using namespace metal; | ||||
| struct Input { | ||||
|   float4 position; | ||||
| }; | ||||
| struct Output { | ||||
|   float4 position; | ||||
| }; | ||||
| struct tint_symbol_2 { | ||||
|   float4 position [[attribute(0)]]; | ||||
| }; | ||||
| struct tint_symbol_3 { | ||||
|   float4 position [[position]]; | ||||
| }; | ||||
| 
 | ||||
| Output tint_symbol_inner(Input in) { | ||||
|   Output const tint_symbol_4 = {.position=in.position}; | ||||
|   return tint_symbol_4; | ||||
| } | ||||
| 
 | ||||
| vertex tint_symbol_3 tint_symbol(tint_symbol_2 tint_symbol_1 [[stage_in]]) { | ||||
|   Input const tint_symbol_5 = {.position=tint_symbol_1.position}; | ||||
|   Output const inner_result = tint_symbol_inner(tint_symbol_5); | ||||
|   tint_symbol_3 wrapper_result = {}; | ||||
|   wrapper_result.position = inner_result.position; | ||||
|   return wrapper_result; | ||||
| } | ||||
| 
 | ||||
							
								
								
									
										56
									
								
								test/benchmark/simple_vertex.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										56
									
								
								test/benchmark/simple_vertex.wgsl.expected.spvasm
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,56 @@ | ||||
| ; SPIR-V | ||||
| ; Version: 1.3 | ||||
| ; Generator: Google Tint Compiler; 0 | ||||
| ; Bound: 28 | ||||
| ; Schema: 0 | ||||
|                OpCapability Shader | ||||
|                OpMemoryModel Logical GLSL450 | ||||
|                OpEntryPoint Vertex %main "main" %position_1 %position_2 %vertex_point_size | ||||
|                OpName %position_1 "position_1" | ||||
|                OpName %position_2 "position_2" | ||||
|                OpName %vertex_point_size "vertex_point_size" | ||||
|                OpName %Output "Output" | ||||
|                OpMemberName %Output 0 "position" | ||||
|                OpName %Input "Input" | ||||
|                OpMemberName %Input 0 "position" | ||||
|                OpName %main_inner "main_inner" | ||||
|                OpName %in "in" | ||||
|                OpName %main "main" | ||||
|                OpDecorate %position_1 Location 0 | ||||
|                OpDecorate %position_2 BuiltIn Position | ||||
|                OpDecorate %vertex_point_size BuiltIn PointSize | ||||
|                OpMemberDecorate %Output 0 Offset 0 | ||||
|                OpMemberDecorate %Input 0 Offset 0 | ||||
|       %float = OpTypeFloat 32 | ||||
|     %v4float = OpTypeVector %float 4 | ||||
| %_ptr_Input_v4float = OpTypePointer Input %v4float | ||||
|  %position_1 = OpVariable %_ptr_Input_v4float Input | ||||
| %_ptr_Output_v4float = OpTypePointer Output %v4float | ||||
|           %7 = OpConstantNull %v4float | ||||
|  %position_2 = OpVariable %_ptr_Output_v4float Output %7 | ||||
| %_ptr_Output_float = OpTypePointer Output %float | ||||
|          %10 = OpConstantNull %float | ||||
| %vertex_point_size = OpVariable %_ptr_Output_float Output %10 | ||||
|      %Output = OpTypeStruct %v4float | ||||
|       %Input = OpTypeStruct %v4float | ||||
|          %11 = OpTypeFunction %Output %Input | ||||
|        %void = OpTypeVoid | ||||
|          %19 = OpTypeFunction %void | ||||
|     %float_1 = OpConstant %float 1 | ||||
|  %main_inner = OpFunction %Output None %11 | ||||
|          %in = OpFunctionParameter %Input | ||||
|          %16 = OpLabel | ||||
|          %17 = OpCompositeExtract %v4float %in 0 | ||||
|          %18 = OpCompositeConstruct %Output %17 | ||||
|                OpReturnValue %18 | ||||
|                OpFunctionEnd | ||||
|        %main = OpFunction %void None %19 | ||||
|          %22 = OpLabel | ||||
|          %24 = OpLoad %v4float %position_1 | ||||
|          %25 = OpCompositeConstruct %Input %24 | ||||
|          %23 = OpFunctionCall %Output %main_inner %25 | ||||
|          %26 = OpCompositeExtract %v4float %23 0 | ||||
|                OpStore %position_2 %26 | ||||
|                OpStore %vertex_point_size %float_1 | ||||
|                OpReturn | ||||
|                OpFunctionEnd | ||||
							
								
								
									
										14
									
								
								test/benchmark/simple_vertex.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										14
									
								
								test/benchmark/simple_vertex.wgsl.expected.wgsl
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,14 @@ | ||||
| struct Input { | ||||
|   [[location(0)]] | ||||
|   position : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| struct Output { | ||||
|   [[builtin(position)]] | ||||
|   position : vec4<f32>; | ||||
| }; | ||||
| 
 | ||||
| [[stage(vertex)]] | ||||
| fn main(in : Input) -> Output { | ||||
|   return Output(in.position); | ||||
| } | ||||
							
								
								
									
										5
									
								
								third_party/CMakeLists.txt
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										5
									
								
								third_party/CMakeLists.txt
									
									
									
									
										vendored
									
									
								
							| @ -12,6 +12,11 @@ | ||||
| # See the License for the specific language governing permissions and | ||||
| # limitations under the License. | ||||
| 
 | ||||
| if (${TINT_BUILD_BENCHMARKS}) | ||||
|   set(BENCHMARK_ENABLE_TESTING FALSE CACHE BOOL FALSE FORCE) | ||||
|   add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/benchmark EXCLUDE_FROM_ALL) | ||||
| endif() | ||||
| 
 | ||||
| if (${TINT_BUILD_TESTS} AND NOT TARGET gmock) | ||||
|   set(gtest_force_shared_crt ON CACHE BOOL "Controls whether a shared run-time library should be used even when Google Test is built as static library" FORCE) | ||||
|   add_subdirectory(${CMAKE_CURRENT_SOURCE_DIR}/googletest EXCLUDE_FROM_ALL) | ||||
|  | ||||
							
								
								
									
										33
									
								
								tools/benchdiff
									
									
									
									
									
										Executable file
									
								
							
							
						
						
									
										33
									
								
								tools/benchdiff
									
									
									
									
									
										Executable file
									
								
							| @ -0,0 +1,33 @@ | ||||
| #!/usr/bin/env bash | ||||
| # Copyright 2022 The Tint Authors | ||||
| # | ||||
| # Licensed under the Apache License, Version 2.0 (the "License"); | ||||
| # you may not use this file except in compliance with the License. | ||||
| # You may obtain a copy of the License at | ||||
| # | ||||
| #     http://www.apache.org/licenses/LICENSE-2.0 | ||||
| # | ||||
| # Unless required by applicable law or agreed to in writing, software | ||||
| # distributed under the License is distributed on an "AS IS" BASIS, | ||||
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||||
| # See the License for the specific language governing permissions and | ||||
| # limitations under the License. | ||||
| 
 | ||||
| set -e # Fail on any error. | ||||
| 
 | ||||
| if [ ! -x "$(which go)" ] ; then | ||||
|     echo "error: go needs to be on \$PATH to use $0" | ||||
|     exit 1 | ||||
| fi | ||||
| 
 | ||||
| SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1 && pwd )" | ||||
| ROOT_DIR="$( cd "${SCRIPT_DIR}/.." >/dev/null 2>&1 && pwd )" | ||||
| BINARY="${SCRIPT_DIR}/bin/benchdiff" | ||||
| 
 | ||||
| # Rebuild the binary. | ||||
| # Note, go caches build artifacts, so this is quick for repeat calls | ||||
| pushd "${SCRIPT_DIR}/src/cmd/benchdiff" > /dev/null | ||||
|     go build -o "${BINARY}" main.go | ||||
| popd > /dev/null | ||||
| 
 | ||||
| "${BINARY}" "$@" | ||||
							
								
								
									
										150
									
								
								tools/src/bench/bench.go
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										150
									
								
								tools/src/bench/bench.go
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,150 @@ | ||||
| // Copyright 2022 The Tint Authors | ||||
| // | ||||
| // Licensed under the Apache License, Version 2.0 (the "License"); | ||||
| // you may not use this file except in compliance with the License. | ||||
| // You may obtain a copy of the License at | ||||
| // | ||||
| //     https://www.apache.org/licenses/LICENSE-2.0 | ||||
| // | ||||
| // Unless required by applicable law or agreed to in writing, software | ||||
| // distributed under the License is distributed on an "AS IS" BASIS, | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||||
| // See the License for the specific language governing permissions and | ||||
| // limitations under the License. | ||||
| 
 | ||||
| // Package bench provides types and methods for parsing Google benchmark results. | ||||
| package bench | ||||
| 
 | ||||
| import ( | ||||
| 	"encoding/json" | ||||
| 	"errors" | ||||
| 	"fmt" | ||||
| 	"regexp" | ||||
| 	"strconv" | ||||
| 	"strings" | ||||
| 	"time" | ||||
| ) | ||||
| 
 | ||||
| // Test holds the results of a single benchmark test. | ||||
| type Test struct { | ||||
| 	Name       string | ||||
| 	NumTasks   uint | ||||
| 	NumThreads uint | ||||
| 	Duration   time.Duration | ||||
| 	Iterations uint | ||||
| } | ||||
| 
 | ||||
| var testVarRE = regexp.MustCompile(`([\w])+:([0-9]+)`) | ||||
| 
 | ||||
| func (t *Test) parseName() { | ||||
| 	for _, match := range testVarRE.FindAllStringSubmatch(t.Name, -1) { | ||||
| 		if len(match) != 3 { | ||||
| 			continue | ||||
| 		} | ||||
| 		n, err := strconv.Atoi(match[2]) | ||||
| 		if err != nil { | ||||
| 			continue | ||||
| 		} | ||||
| 		switch match[1] { | ||||
| 		case "threads": | ||||
| 			t.NumThreads = uint(n) | ||||
| 		case "tasks": | ||||
| 			t.NumTasks = uint(n) | ||||
| 		} | ||||
| 	} | ||||
| } | ||||
| 
 | ||||
| // Benchmark holds a set of benchmark test results. | ||||
| type Benchmark struct { | ||||
| 	Tests []Test | ||||
| } | ||||
| 
 | ||||
| // Parse parses the benchmark results from the string s. | ||||
| // Parse will handle the json and 'console' formats. | ||||
| func Parse(s string) (Benchmark, error) { | ||||
| 	type Parser = func(s string) (Benchmark, error) | ||||
| 	for _, parser := range []Parser{parseConsole, parseJSON} { | ||||
| 		b, err := parser(s) | ||||
| 		switch err { | ||||
| 		case nil: | ||||
| 			return b, nil | ||||
| 		case errWrongFormat: | ||||
| 		default: | ||||
| 			return Benchmark{}, err | ||||
| 		} | ||||
| 	} | ||||
| 
 | ||||
| 	return Benchmark{}, errors.New("Unrecognised file format") | ||||
| } | ||||
| 
 | ||||
| var errWrongFormat = errors.New("Wrong format") | ||||
| var consoleLineRE = regexp.MustCompile(`([\w/:]+)\s+([0-9]+(?:.[0-9]+)?) ns\s+[0-9]+(?:.[0-9]+) ns\s+([0-9]+)`) | ||||
| 
 | ||||
| func parseConsole(s string) (Benchmark, error) { | ||||
| 	blocks := strings.Split(s, "------------------------------------------------------------------------------------------") | ||||
| 	if len(blocks) != 3 { | ||||
| 		return Benchmark{}, errWrongFormat | ||||
| 	} | ||||
| 
 | ||||
| 	lines := strings.Split(blocks[2], "\n") | ||||
| 	b := Benchmark{ | ||||
| 		Tests: make([]Test, 0, len(lines)), | ||||
| 	} | ||||
| 	for _, line := range lines { | ||||
| 		if len(line) == 0 { | ||||
| 			continue | ||||
| 		} | ||||
| 		matches := consoleLineRE.FindStringSubmatch(line) | ||||
| 		if len(matches) != 4 { | ||||
| 			return Benchmark{}, fmt.Errorf("Unable to parse the line:\n" + line) | ||||
| 		} | ||||
| 		ns, err := strconv.ParseFloat(matches[2], 64) | ||||
| 		if err != nil { | ||||
| 			return Benchmark{}, fmt.Errorf("Unable to parse the duration: " + matches[2]) | ||||
| 		} | ||||
| 		iterations, err := strconv.Atoi(matches[3]) | ||||
| 		if err != nil { | ||||
| 			return Benchmark{}, fmt.Errorf("Unable to parse the number of iterations: " + matches[3]) | ||||
| 		} | ||||
| 
 | ||||
| 		t := Test{ | ||||
| 			Name:       matches[1], | ||||
| 			Duration:   time.Nanosecond * time.Duration(ns), | ||||
| 			Iterations: uint(iterations), | ||||
| 		} | ||||
| 		t.parseName() | ||||
| 		b.Tests = append(b.Tests, t) | ||||
| 	} | ||||
| 	return b, nil | ||||
| } | ||||
| 
 | ||||
| func parseJSON(s string) (Benchmark, error) { | ||||
| 	type T struct { | ||||
| 		Name       string  `json:"name"` | ||||
| 		Iterations uint    `json:"iterations"` | ||||
| 		Time       float64 `json:"real_time"` | ||||
| 	} | ||||
| 	type B struct { | ||||
| 		Tests []T `json:"benchmarks"` | ||||
| 	} | ||||
| 	b := B{} | ||||
| 	d := json.NewDecoder(strings.NewReader(s)) | ||||
| 	if err := d.Decode(&b); err != nil { | ||||
| 		return Benchmark{}, err | ||||
| 	} | ||||
| 
 | ||||
| 	out := Benchmark{ | ||||
| 		Tests: make([]Test, len(b.Tests)), | ||||
| 	} | ||||
| 	for i, test := range b.Tests { | ||||
| 		t := Test{ | ||||
| 			Name:       test.Name, | ||||
| 			Duration:   time.Nanosecond * time.Duration(int64(test.Time)), | ||||
| 			Iterations: test.Iterations, | ||||
| 		} | ||||
| 		t.parseName() | ||||
| 		out.Tests[i] = t | ||||
| 	} | ||||
| 
 | ||||
| 	return out, nil | ||||
| } | ||||
							
								
								
									
										177
									
								
								tools/src/cmd/benchdiff/main.go
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										177
									
								
								tools/src/cmd/benchdiff/main.go
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,177 @@ | ||||
| // Copyright 2022 The Tint Authors. | ||||
| // | ||||
| // Licensed under the Apache License, Version 2.0 (the "License"); | ||||
| // you may not use this file except in compliance with the License. | ||||
| // You may obtain a copy of the License at | ||||
| // | ||||
| //     https://www.apache.org/licenses/LICENSE-2.0 | ||||
| // | ||||
| // Unless required by applicable law or agreed to in writing, software | ||||
| // distributed under the License is distributed on an "AS IS" BASIS, | ||||
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||||
| // See the License for the specific language governing permissions and | ||||
| // limitations under the License. | ||||
| 
 | ||||
| // benchdiff is a tool that compares two Google benchmark results and displays | ||||
| // sorted performance differences. | ||||
| package main | ||||
| 
 | ||||
| import ( | ||||
| 	"errors" | ||||
| 	"flag" | ||||
| 	"fmt" | ||||
| 	"io/ioutil" | ||||
| 	"os" | ||||
| 	"path/filepath" | ||||
| 	"sort" | ||||
| 	"strings" | ||||
| 	"text/tabwriter" | ||||
| 	"time" | ||||
| 
 | ||||
| 	"dawn.googlesource.com/tint/tools/src/bench" | ||||
| ) | ||||
| 
 | ||||
| var ( | ||||
| 	minDiff    = flag.Duration("min-diff", time.Microsecond*10, "Filter away time diffs less than this duration") | ||||
| 	minRelDiff = flag.Float64("min-rel-diff", 0.01, "Filter away absolute relative diffs between [1, 1+x]") | ||||
| ) | ||||
| 
 | ||||
| func main() { | ||||
| 	flag.ErrHelp = errors.New("benchdiff is a tool to compare two benchmark results") | ||||
| 	flag.Parse() | ||||
| 	flag.Usage = func() { | ||||
| 		fmt.Fprintln(os.Stderr, "benchdiff <benchmark-a> <benchmark-b>") | ||||
| 		flag.PrintDefaults() | ||||
| 	} | ||||
| 
 | ||||
| 	args := flag.Args() | ||||
| 	if len(args) < 2 { | ||||
| 		flag.Usage() | ||||
| 		os.Exit(1) | ||||
| 	} | ||||
| 
 | ||||
| 	pathA, pathB := args[0], args[1] | ||||
| 
 | ||||
| 	if err := run(pathA, pathB); err != nil { | ||||
| 		fmt.Fprintln(os.Stderr, err) | ||||
| 		os.Exit(-1) | ||||
| 	} | ||||
| } | ||||
| 
 | ||||
| func run(pathA, pathB string) error { | ||||
| 	fileA, err := ioutil.ReadFile(pathA) | ||||
| 	if err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 	benchA, err := bench.Parse(string(fileA)) | ||||
| 	if err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 
 | ||||
| 	fileB, err := ioutil.ReadFile(pathB) | ||||
| 	if err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 	benchB, err := bench.Parse(string(fileB)) | ||||
| 	if err != nil { | ||||
| 		return err | ||||
| 	} | ||||
| 
 | ||||
| 	compare(benchA, benchB, fileName(pathA), fileName(pathB)) | ||||
| 
 | ||||
| 	return nil | ||||
| } | ||||
| 
 | ||||
| func fileName(path string) string { | ||||
| 	_, name := filepath.Split(path) | ||||
| 	return name | ||||
| } | ||||
| 
 | ||||
| func compare(benchA, benchB bench.Benchmark, nameA, nameB string) { | ||||
| 	type times struct { | ||||
| 		a time.Duration | ||||
| 		b time.Duration | ||||
| 	} | ||||
| 	byName := map[string]times{} | ||||
| 	for _, test := range benchA.Tests { | ||||
| 		byName[test.Name] = times{a: test.Duration} | ||||
| 	} | ||||
| 	for _, test := range benchB.Tests { | ||||
| 		t := byName[test.Name] | ||||
| 		t.b = test.Duration | ||||
| 		byName[test.Name] = t | ||||
| 	} | ||||
| 
 | ||||
| 	type delta struct { | ||||
| 		name       string | ||||
| 		times      times | ||||
| 		relDiff    float64 | ||||
| 		absRelDiff float64 | ||||
| 	} | ||||
| 	deltas := []delta{} | ||||
| 	for name, times := range byName { | ||||
| 		if times.a == 0 || times.b == 0 { | ||||
| 			continue // Assuming test was missing from a or b | ||||
| 		} | ||||
| 		diff := times.b - times.a | ||||
| 		absDiff := diff | ||||
| 		if absDiff < 0 { | ||||
| 			absDiff = -absDiff | ||||
| 		} | ||||
| 		if absDiff < *minDiff { | ||||
| 			continue | ||||
| 		} | ||||
| 
 | ||||
| 		relDiff := float64(times.b) / float64(times.a) | ||||
| 		absRelDiff := relDiff | ||||
| 		if absRelDiff < 1 { | ||||
| 			absRelDiff = 1.0 / absRelDiff | ||||
| 		} | ||||
| 		if absRelDiff < (1.0 + *minRelDiff) { | ||||
| 			continue | ||||
| 		} | ||||
| 
 | ||||
| 		d := delta{ | ||||
| 			name:       name, | ||||
| 			times:      times, | ||||
| 			relDiff:    relDiff, | ||||
| 			absRelDiff: absRelDiff, | ||||
| 		} | ||||
| 		deltas = append(deltas, d) | ||||
| 	} | ||||
| 
 | ||||
| 	sort.Slice(deltas, func(i, j int) bool { return deltas[j].relDiff < deltas[i].relDiff }) | ||||
| 
 | ||||
| 	fmt.Println("A:", nameA) | ||||
| 	fmt.Println("B:", nameB) | ||||
| 	fmt.Println() | ||||
| 
 | ||||
| 	buf := strings.Builder{} | ||||
| 	{ | ||||
| 		w := tabwriter.NewWriter(&buf, 1, 1, 0, ' ', 0) | ||||
| 		fmt.Fprintln(w, "Test name\t | Δ (A → B)\t | % (A → B)\t | % (B → A)\t | × (A → B)\t | × (B → A)\t | A \t | B") | ||||
| 		fmt.Fprintln(w, "\t-+\t-+\t-+\t-+\t-+\t-+\t-+\t-") | ||||
| 		for _, delta := range deltas { | ||||
| 			a2b := delta.times.b - delta.times.a | ||||
| 			fmt.Fprintf(w, "%v \t | %v \t | %+2.1f%% \t | %+2.1f%% \t | %+.4f \t | %+.4f \t | %v \t | %v \t|\n", | ||||
| 				delta.name, | ||||
| 				a2b, // Δ (A → B) | ||||
| 				100*float64(a2b)/float64(delta.times.a),       // % (A → B) | ||||
| 				100*float64(-a2b)/float64(delta.times.b),      // % (B → A) | ||||
| 				float64(delta.times.b)/float64(delta.times.a), // × (A → B) | ||||
| 				float64(delta.times.a)/float64(delta.times.b), // × (B → A) | ||||
| 				delta.times.a, // A | ||||
| 				delta.times.b, // B | ||||
| 			) | ||||
| 		} | ||||
| 		w.Flush() | ||||
| 	} | ||||
| 
 | ||||
| 	// Split the table by line so we can add in a header line | ||||
| 	lines := strings.Split(buf.String(), "\n") | ||||
| 	fmt.Println(lines[0]) | ||||
| 	fmt.Println(strings.ReplaceAll(lines[1], " ", "-")) | ||||
| 	for _, l := range lines[2:] { | ||||
| 		fmt.Println(l) | ||||
| 	} | ||||
| } | ||||
		Loading…
	
	
			
			x
			
			
		
	
		Reference in New Issue
	
	Block a user