//===-- Common utility class for differential analysis --------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "src/__support/CPP/algorithm.h" #include "src/__support/FPUtil/FPBits.h" #include "src/__support/macros/config.h" #include "test/src/math/performance_testing/Timer.h" #include #include namespace LIBC_NAMESPACE_DECL { namespace testing { template class BinaryOpSingleOutputPerf { using FPBits = fputil::FPBits; using StorageType = typename FPBits::StorageType; static constexpr StorageType UIntMax = cpp::numeric_limits::max(); public: typedef OutputType Func(InputType, InputType); static void run_perf_in_range(Func myFunc, Func otherFunc, StorageType startingBit, StorageType endingBit, size_t N, size_t rounds, std::ofstream &log) { if (sizeof(StorageType) <= sizeof(size_t)) N = cpp::min(N, static_cast(endingBit - startingBit)); auto runner = [=](Func func) { [[maybe_unused]] volatile OutputType result; if (endingBit < startingBit) { return; } StorageType step = (endingBit - startingBit) / N; for (size_t i = 0; i < rounds; i++) { for (StorageType bitsX = startingBit, bitsY = endingBit;; bitsX += step, bitsY -= step) { InputType x = FPBits(bitsX).get_val(); InputType y = FPBits(bitsY).get_val(); result = func(x, y); if (endingBit - bitsX < step) { break; } } } }; Timer timer; timer.start(); runner(myFunc); timer.stop(); double my_average = static_cast(timer.nanoseconds()) / N / rounds; log << "-- My function --\n"; log << " Total time : " << timer.nanoseconds() << " ns \n"; log << " Average runtime : " << my_average << " ns/op \n"; log << " Ops per second : " << static_cast(1'000'000'000.0 / my_average) << " op/s \n"; timer.start(); runner(otherFunc); timer.stop(); double other_average = static_cast(timer.nanoseconds()) / N / rounds; log << "-- Other function --\n"; log << " Total time : " << timer.nanoseconds() << " ns \n"; log << " Average runtime : " << other_average << " ns/op \n"; log << " Ops per second : " << static_cast(1'000'000'000.0 / other_average) << " op/s \n"; log << "-- Average runtime ratio --\n"; log << " Mine / Other's : " << my_average / other_average << " \n"; } static void run_perf(Func myFunc, Func otherFunc, int rounds, const char *logFile) { std::ofstream log(logFile); log << " Performance tests with inputs in denormal range:\n"; run_perf_in_range(myFunc, otherFunc, /* startingBit= */ StorageType(0), /* endingBit= */ FPBits::max_subnormal().uintval(), 1'000'001, rounds, log); log << "\n Performance tests with inputs in normal range:\n"; run_perf_in_range(myFunc, otherFunc, /* startingBit= */ FPBits::min_normal().uintval(), /* endingBit= */ FPBits::max_normal().uintval(), 1'000'001, rounds, log); log << "\n Performance tests with inputs in normal range with exponents " "close to each other:\n"; run_perf_in_range( myFunc, otherFunc, /* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(), /* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 1'000'001, rounds, log); } static void run_diff(Func myFunc, Func otherFunc, const char *logFile) { uint64_t diffCount = 0; std::ofstream log(logFile); log << " Diff tests with inputs in denormal range:\n"; diffCount += run_diff_in_range( myFunc, otherFunc, /* startingBit= */ StorageType(0), /* endingBit= */ FPBits::max_subnormal().uintval(), 1'000'001, log); log << "\n Diff tests with inputs in normal range:\n"; diffCount += run_diff_in_range( myFunc, otherFunc, /* startingBit= */ FPBits::min_normal().uintval(), /* endingBit= */ FPBits::max_normal().uintval(), 100'000'001, log); log << "\n Diff tests with inputs in normal range with exponents " "close to each other:\n"; diffCount += run_diff_in_range( myFunc, otherFunc, /* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(), /* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 10'000'001, log); log << "Total number of differing results: " << diffCount << '\n'; } }; } // namespace testing } // namespace LIBC_NAMESPACE_DECL #define BINARY_OP_SINGLE_OUTPUT_PERF(OutputType, InputType, myFunc, otherFunc, \ filename) \ int main() { \ LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \ OutputType, InputType>::run_perf(&myFunc, &otherFunc, 1, filename); \ return 0; \ } #define BINARY_OP_SINGLE_OUTPUT_PERF_EX(OutputType, InputType, myFunc, \ otherFunc, rounds, filename) \ { \ LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \ OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds, \ filename); \ LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \ OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds, \ filename); \ }