// libc/test/src/math/performance_testing/BinaryOpSingleOutputPerf.h - llvm-project - Git at Google

 //===-- Common utility class for differential analysis --------------------===//
 //
 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 // See https://llvm.org/LICENSE.txt for license information.
 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 //
 //===----------------------------------------------------------------------===//

 #include "src/__support/CPP/algorithm.h"
 #include "src/__support/FPUtil/FPBits.h"
 #include "src/__support/macros/config.h"
 #include "test/src/math/performance_testing/Timer.h"

 #include <cstddef>
 #include <fstream>

 namespace LIBC_NAMESPACE_DECL {
 namespace testing {
 template <typename OutputType, typename InputType>
 class BinaryOpSingleOutputPerf {
   using FPBits = fputil::FPBits<OutputType>;
   using StorageType = typename FPBits::StorageType;
   static constexpr StorageType UIntMax =
       cpp::numeric_limits<StorageType>::max();

 public:
   typedef OutputType Func(InputType, InputType);

   static void run_perf_in_range(Func myFunc, Func otherFunc,
                                 StorageType startingBit, StorageType endingBit,
                                 size_t N, size_t rounds, std::ofstream &log) {
     if (sizeof(StorageType) <= sizeof(size_t))
       N = cpp::min(N, static_cast<size_t>(endingBit - startingBit));

     auto runner = [=](Func func) {
       [[maybe_unused]] volatile OutputType result;
       if (endingBit < startingBit) {
         return;
       }

       StorageType step = (endingBit - startingBit) / N;
       for (size_t i = 0; i < rounds; i++) {
         for (StorageType bitsX = startingBit, bitsY = endingBit;;
              bitsX += step, bitsY -= step) {
           InputType x = FPBits(bitsX).get_val();
           InputType y = FPBits(bitsY).get_val();
           result = func(x, y);
           if (endingBit - bitsX < step) {
             break;
           }
         }
       }
     };

     Timer timer;
     timer.start();
     runner(myFunc);
     timer.stop();

     double my_average = static_cast<double>(timer.nanoseconds()) / N / rounds;
     log << "-- My function --\n";
     log << "     Total time      : " << timer.nanoseconds() << " ns \n";
     log << "     Average runtime : " << my_average << " ns/op \n";
     log << "     Ops per second  : "
         << static_cast<uint64_t>(1'000'000'000.0 / my_average) << " op/s \n";

     timer.start();
     runner(otherFunc);
     timer.stop();

     double other_average =
         static_cast<double>(timer.nanoseconds()) / N / rounds;
     log << "-- Other function --\n";
     log << "     Total time      : " << timer.nanoseconds() << " ns \n";
     log << "     Average runtime : " << other_average << " ns/op \n";
     log << "     Ops per second  : "
         << static_cast<uint64_t>(1'000'000'000.0 / other_average) << " op/s \n";

     log << "-- Average runtime ratio --\n";
     log << "     Mine / Other's  : " << my_average / other_average << " \n";
   }

   static void run_perf(Func myFunc, Func otherFunc, int rounds,
                        const char *logFile) {
     std::ofstream log(logFile);
     log << " Performance tests with inputs in denormal range:\n";
     run_perf_in_range(myFunc, otherFunc, /* startingBit= */ StorageType(0),
                       /* endingBit= */ FPBits::max_subnormal().uintval(),
                       1'000'001, rounds, log);
     log << "\n Performance tests with inputs in normal range:\n";
     run_perf_in_range(myFunc, otherFunc,
                       /* startingBit= */ FPBits::min_normal().uintval(),
                       /* endingBit= */ FPBits::max_normal().uintval(),
                       1'000'001, rounds, log);
     log << "\n Performance tests with inputs in normal range with exponents "
            "close to each other:\n";
     run_perf_in_range(
         myFunc, otherFunc,
         /* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(),
         /* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 1'000'001,
         rounds, log);
   }

   static void run_diff(Func myFunc, Func otherFunc, const char *logFile) {
     uint64_t diffCount = 0;
     std::ofstream log(logFile);
     log << " Diff tests with inputs in denormal range:\n";
     diffCount += run_diff_in_range(
         myFunc, otherFunc, /* startingBit= */ StorageType(0),
         /* endingBit= */ FPBits::max_subnormal().uintval(), 1'000'001, log);
     log << "\n Diff tests with inputs in normal range:\n";
     diffCount += run_diff_in_range(
         myFunc, otherFunc,
         /* startingBit= */ FPBits::min_normal().uintval(),
         /* endingBit= */ FPBits::max_normal().uintval(), 100'000'001, log);
     log << "\n Diff tests with inputs in normal range with exponents "
            "close to each other:\n";
     diffCount += run_diff_in_range(
         myFunc, otherFunc,
         /* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(),
         /* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 10'000'001,
         log);

     log << "Total number of differing results: " << diffCount << '\n';
   }
 };

 } // namespace testing
 } // namespace LIBC_NAMESPACE_DECL

 #define BINARY_OP_SINGLE_OUTPUT_PERF(OutputType, InputType, myFunc, otherFunc, \
                                      filename)                                 \
   int main() {                                                                 \
     LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf<                         \
         OutputType, InputType>::run_perf(&myFunc, &otherFunc, 1, filename);    \
     return 0;                                                                  \
   }

 #define BINARY_OP_SINGLE_OUTPUT_PERF_EX(OutputType, InputType, myFunc,         \
                                         otherFunc, rounds, filename)           \
   {                                                                            \
     LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf<                         \
         OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds,          \
                                          filename);                            \
     LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf<                         \
         OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds,          \
                                          filename);                            \
   }
	//===-- Common utility class for differential analysis --------------------===//
	//
	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
	// See https://llvm.org/LICENSE.txt for license information.
	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
	//
	//===----------------------------------------------------------------------===//

	#include "src/__support/CPP/algorithm.h"
	#include "src/__support/FPUtil/FPBits.h"
	#include "src/__support/macros/config.h"
	#include "test/src/math/performance_testing/Timer.h"

	#include <cstddef>
	#include <fstream>

	namespace LIBC_NAMESPACE_DECL {
	namespace testing {
	template <typename OutputType, typename InputType>
	class BinaryOpSingleOutputPerf {
	using FPBits = fputil::FPBits<OutputType>;
	using StorageType = typename FPBits::StorageType;
	static constexpr StorageType UIntMax =
	cpp::numeric_limits<StorageType>::max();

	public:
	typedef OutputType Func(InputType, InputType);

	static void run_perf_in_range(Func myFunc, Func otherFunc,
	StorageType startingBit, StorageType endingBit,
	size_t N, size_t rounds, std::ofstream &log) {
	if (sizeof(StorageType) <= sizeof(size_t))
	N = cpp::min(N, static_cast<size_t>(endingBit - startingBit));

	auto runner = [=](Func func) {
	[[maybe_unused]] volatile OutputType result;
	if (endingBit < startingBit) {
	return;
	}

	StorageType step = (endingBit - startingBit) / N;
	for (size_t i = 0; i < rounds; i++) {
	for (StorageType bitsX = startingBit, bitsY = endingBit;;
	bitsX += step, bitsY -= step) {
	InputType x = FPBits(bitsX).get_val();
	InputType y = FPBits(bitsY).get_val();
	result = func(x, y);
	if (endingBit - bitsX < step) {
	break;
	}
	}
	}
	};

	Timer timer;
	timer.start();
	runner(myFunc);
	timer.stop();

	double my_average = static_cast<double>(timer.nanoseconds()) / N / rounds;
	log << "-- My function --\n";
	log << " Total time : " << timer.nanoseconds() << " ns \n";
	log << " Average runtime : " << my_average << " ns/op \n";
	log << " Ops per second : "
	<< static_cast<uint64_t>(1'000'000'000.0 / my_average) << " op/s \n";

	timer.start();
	runner(otherFunc);
	timer.stop();

	double other_average =
	static_cast<double>(timer.nanoseconds()) / N / rounds;
	log << "-- Other function --\n";
	log << " Total time : " << timer.nanoseconds() << " ns \n";
	log << " Average runtime : " << other_average << " ns/op \n";
	log << " Ops per second : "
	<< static_cast<uint64_t>(1'000'000'000.0 / other_average) << " op/s \n";

	log << "-- Average runtime ratio --\n";
	log << " Mine / Other's : " << my_average / other_average << " \n";
	}

	static void run_perf(Func myFunc, Func otherFunc, int rounds,
	const char *logFile) {
	std::ofstream log(logFile);
	log << " Performance tests with inputs in denormal range:\n";
	run_perf_in_range(myFunc, otherFunc, /* startingBit= */ StorageType(0),
	/* endingBit= */ FPBits::max_subnormal().uintval(),
	1'000'001, rounds, log);
	log << "\n Performance tests with inputs in normal range:\n";
	run_perf_in_range(myFunc, otherFunc,
	/* startingBit= */ FPBits::min_normal().uintval(),
	/* endingBit= */ FPBits::max_normal().uintval(),
	1'000'001, rounds, log);
	log << "\n Performance tests with inputs in normal range with exponents "
	"close to each other:\n";
	run_perf_in_range(
	myFunc, otherFunc,
	/* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(),
	/* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 1'000'001,
	rounds, log);
	}

	static void run_diff(Func myFunc, Func otherFunc, const char *logFile) {
	uint64_t diffCount = 0;
	std::ofstream log(logFile);
	log << " Diff tests with inputs in denormal range:\n";
	diffCount += run_diff_in_range(
	myFunc, otherFunc, /* startingBit= */ StorageType(0),
	/* endingBit= */ FPBits::max_subnormal().uintval(), 1'000'001, log);
	log << "\n Diff tests with inputs in normal range:\n";
	diffCount += run_diff_in_range(
	myFunc, otherFunc,
	/* startingBit= */ FPBits::min_normal().uintval(),
	/* endingBit= */ FPBits::max_normal().uintval(), 100'000'001, log);
	log << "\n Diff tests with inputs in normal range with exponents "
	"close to each other:\n";
	diffCount += run_diff_in_range(
	myFunc, otherFunc,
	/* startingBit= */ FPBits(OutputType(0x1.0p-10)).uintval(),
	/* endingBit= */ FPBits(OutputType(0x1.0p+10)).uintval(), 10'000'001,
	log);

	log << "Total number of differing results: " << diffCount << '\n';
	}
	};

	} // namespace testing
	} // namespace LIBC_NAMESPACE_DECL

	#define BINARY_OP_SINGLE_OUTPUT_PERF(OutputType, InputType, myFunc, otherFunc, \
	filename) \
	int main() { \
	LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \
	OutputType, InputType>::run_perf(&myFunc, &otherFunc, 1, filename); \
	return 0; \
	}

	#define BINARY_OP_SINGLE_OUTPUT_PERF_EX(OutputType, InputType, myFunc, \
	otherFunc, rounds, filename) \
	{ \
	LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \
	OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds, \
	filename); \
	LIBC_NAMESPACE::testing::BinaryOpSingleOutputPerf< \
	OutputType, InputType>::run_perf(&myFunc, &otherFunc, rounds, \
	filename); \
	}