cheriot/test/riscv_cheriot_vector_fp_reduction_instructions_test.cc - mpact-cheriot - Git at Google

 // Copyright 2023 Google LLC
 //
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 //     https://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.

 #include "cheriot/riscv_cheriot_vector_fp_reduction_instructions.h"

 #include <algorithm>
 #include <cstdint>
 #include <functional>
 #include <vector>

 #include "absl/random/random.h"
 #include "absl/strings/str_cat.h"
 #include "absl/strings/string_view.h"
 #include "absl/types/span.h"
 #include "cheriot/test/riscv_cheriot_vector_fp_test_utilities.h"
 #include "cheriot/test/riscv_cheriot_vector_instructions_test_base.h"
 #include "googlemock/include/gmock/gmock.h"
 #include "mpact/sim/generic/instruction.h"
 #include "riscv//riscv_fp_host.h"
 #include "riscv//riscv_fp_info.h"
 #include "riscv//riscv_fp_state.h"
 #include "riscv//riscv_register.h"

 namespace {

 using Instruction = ::mpact::sim::generic::Instruction;

 // Functions to test.

 using ::mpact::sim::cheriot::Vfredmax;
 using ::mpact::sim::cheriot::Vfredmin;
 using ::mpact::sim::cheriot::Vfredosum;
 using ::mpact::sim::cheriot::Vfwredosum;

 using ::absl::Span;
 using ::mpact::sim::riscv::FPRoundingMode;
 using ::mpact::sim::riscv::RVFpRegister;
 using ::mpact::sim::riscv::ScopedFPStatus;

 // Test fixture for binary fp instructions.
 class RiscVCheriotFPReductionInstructionsTest
     : public RiscVCheriotFPInstructionsTestBase {
  public:
   // Helper function for floating point reduction operations.
   template <typename Vd, typename Vs2, typename Vs1>
   void ReductionOpFPTestHelper(absl::string_view name, int sew,
                                Instruction *inst, int delta_position,
                                std::function<Vd(Vs1, Vs2)> operation) {
     int byte_sew = sew / 8;
     if (byte_sew != sizeof(Vd) && byte_sew != sizeof(Vs2) &&
         byte_sew != sizeof(Vs1)) {
       FAIL() << name << ": selected element width != any operand types"
              << "sew: " << sew << " Vd: " << sizeof(Vd)
              << " Vs2: " << sizeof(Vs2) << " Vs1: " << sizeof(Vs1);
       return;
     }
     // Number of elements per vector register.
     constexpr int vs2_size = kVectorLengthInBytes / sizeof(Vs2);
     constexpr int vs1_size = kVectorLengthInBytes / sizeof(Vs1);
     // Input values for 8 registers.
     Vs2 vs2_value[vs2_size * 8];
     auto vs2_span = Span<Vs2>(vs2_value);
     Vs1 vs1_value[vs1_size * 8];
     auto vs1_span = Span<Vs1>(vs1_value);
     AppendVectorRegisterOperands({kVs2, kVs1, kVmask}, {kVd});
     auto mask_span = Span<const uint8_t>(kA5Mask);
     SetVectorRegisterValues<uint8_t>({{kVmaskName, mask_span}});
     // Iterate across the different lmul values.
     for (int lmul_index = 0; lmul_index < 7; lmul_index++) {
       // Initialize input values.
       FillArrayWithRandomFPValues<Vs2>(vs2_span);
       FillArrayWithRandomFPValues<Vs1>(vs1_span);
       for (int i = 0; i < 8; i++) {
         auto vs2_name = absl::StrCat("v", kVs2 + i);
         auto vs1_name = absl::StrCat("v", kVs1 + i);
         SetVectorRegisterValues<Vs2>(
             {{vs2_name, vs2_span.subspan(vs2_size * i, vs2_size)}});
         SetVectorRegisterValues<Vs1>(
             {{vs1_name, vs1_span.subspan(vs1_size * i, vs1_size)}});
       }
       for (int vlen_count = 0; vlen_count < 4; vlen_count++) {
         int lmul8 = kLmul8Values[lmul_index];
         int lmul8_vs2 = lmul8 * sizeof(Vs2) / byte_sew;
         int lmul8_vs1 = lmul8 * sizeof(Vs1) / byte_sew;
         int lmul8_vd = lmul8 * sizeof(Vd) / byte_sew;
         int num_values = lmul8 * kVectorLengthInBytes / (8 * byte_sew);
         // Set vlen, but leave vlen high at least once.
         int vlen = 1024;
         if (vlen_count > 0) {
           vlen =
               absl::Uniform(absl::IntervalOpenClosed, bitgen_, 0, num_values);
         }
         num_values = std::min(num_values, vlen);
         // Configure vector unit for different lmul settings.
         uint32_t vtype =
             (kSewSettingsByByteSize[byte_sew] << 3) | kLmulSettings[lmul_index];
         ConfigureVectorUnit(vtype, vlen);

         // Iterate across rounding modes.
         for (int rm : {0, 1, 2, 3, 4}) {
           rv_fp_->SetRoundingMode(static_cast<FPRoundingMode>(rm));

           ClearVectorRegisterGroup(kVd, 8);

           inst->Execute();

           if (lmul8_vd < 1 || lmul8_vd > 64) {
             EXPECT_TRUE(rv_vector_->vector_exception())
                 << "lmul8: vd: " << lmul8_vd;
             rv_vector_->clear_vector_exception();
             continue;
           }

           if (lmul8_vs2 < 1 || lmul8_vs2 > 64) {
             EXPECT_TRUE(rv_vector_->vector_exception())
                 << "lmul8: vs2: " << lmul8_vs2;
             rv_vector_->clear_vector_exception();
             continue;
           }

           if (lmul8_vs1 < 1 || lmul8_vs1 > 64) {
             EXPECT_TRUE(rv_vector_->vector_exception())
                 << "lmul8: vs1: " << lmul8_vs1;
             rv_vector_->clear_vector_exception();
             continue;
           }
           EXPECT_FALSE(rv_vector_->vector_exception());
           // Initialize the accumulator with the value from vs1[0].
           Vd accumulator = static_cast<Vd>(vs1_span[0]);
           ScopedFPStatus set_fpstatus(rv_fp_->host_fp_interface());
           for (int i = 0; i < num_values; i++) {
             int mask_index = i >> 3;
             int mask_offset = i & 0b111;
             bool mask_value = (mask_span[mask_index] >> mask_offset) & 0b1;
             if (mask_value) {
               accumulator = operation(accumulator, vs2_span[i]);
             }
           }
           auto reg_val = vreg_[kVd]->data_buffer()->Get<Vd>(0);
           FPCompare<Vd>(accumulator, reg_val, delta_position, "");
         }
       }
     }
   }
 };

 // Test vector floating point sum reduction.
 TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredosum) {
   SetSemanticFunction(&Vfredosum);
   ReductionOpFPTestHelper<float, float, float>(
       "Vfredosum_32", /*sew*/ 32, instruction_, /*delta_position*/ 32,
       [](float val0, float val1) -> float { return val0 + val1; });
   ResetInstruction();
   SetSemanticFunction(&Vfredosum);
   ReductionOpFPTestHelper<double, double, double>(
       "Vfredosum_64", /*sew*/ 64, instruction_, /*delta_position*/ 64,
       [](double val0, double val1) -> double { return val0 + val1; });
 }

 // Test vector floating point widening sum reduction.
 TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfwredosum) {
   SetSemanticFunction(&Vfwredosum);
   ReductionOpFPTestHelper<double, float, double>(
       "Vfwredosum_32", /*sew*/ 32, instruction_, /*delta_position*/ 64,
       [](double val0, float val1) -> double {
         return val0 + static_cast<double>(val1);
       });
 }

 template <typename T>
 T MaxMinHelper(T vs2, T vs1, std::function<T(T, T)> operation) {
   using UInt = typename FPTypeInfo<T>::IntType;
   UInt vs2_uint = *reinterpret_cast<UInt *>(&vs2);
   UInt vs1_uint = *reinterpret_cast<UInt *>(&vs1);
   UInt mask = 1ULL << (FPTypeInfo<T>::kSigSize - 1);
   bool nan_vs2 = std::isnan(vs2);
   bool nan_vs1 = std::isnan(vs1);
   if ((nan_vs2 && ((mask & vs2_uint) == 0)) ||
       (nan_vs1 && ((mask & vs1_uint) == 0)) || (nan_vs2 && nan_vs1)) {
     // Canonical NaN.
     UInt canonical = ((1ULL << (FPTypeInfo<T>::kExpSize + 1)) - 1)
                      << (FPTypeInfo<T>::kSigSize - 1);
     T canonical_fp = *reinterpret_cast<T *>(&canonical);
     return canonical_fp;
   }
   if (nan_vs2) return vs1;
   if (nan_vs1) return vs2;
   return operation(vs2, vs1);
 }

 // Test vector floating point min reduction.
 TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredmin) {
   SetSemanticFunction(&Vfredmin);
   ReductionOpFPTestHelper<float, float, float>(
       "Vfredmin_32", /*sew*/ 32, instruction_, /*delta_position*/ 32,
       [](float val0, float val1) -> float {
         return MaxMinHelper<float>(val0, val1,
                                    [](float val0, float val1) -> float {
                                      return (val0 > val1) ? val1 : val0;
                                    });
       });
   ResetInstruction();
   SetSemanticFunction(&Vfredmin);
   ReductionOpFPTestHelper<double, double, double>(
       "Vfredmin_64", /*sew*/ 64, instruction_, /*delta_position*/ 64,
       [](double val0, double val1) -> double {
         return MaxMinHelper<double>(val0, val1,
                                     [](double val0, double val1) -> double {
                                       return (val0 > val1) ? val1 : val0;
                                     });
       });
 }

 // Test vector floating point max reduction.
 TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredmax) {
   SetSemanticFunction(&Vfredmax);
   ReductionOpFPTestHelper<float, float, float>(
       "Vfredmin_32", /*sew*/ 32, instruction_, /*delta_position*/ 32,
       [](float val0, float val1) -> float {
         return MaxMinHelper<float>(val0, val1,
                                    [](float val0, float val1) -> float {
                                      return (val0 < val1) ? val1 : val0;
                                    });
       });
   ResetInstruction();
   SetSemanticFunction(&Vfredmax);
   ReductionOpFPTestHelper<double, double, double>(
       "Vfredmin_64", /*sew*/ 64, instruction_, /*delta_position*/ 64,
       [](double val0, double val1) -> double {
         return MaxMinHelper<double>(val0, val1,
                                     [](double val0, double val1) -> double {
                                       return (val0 < val1) ? val1 : val0;
                                     });
       });
 }

 }  // namespace
	// Copyright 2023 Google LLC
	//
	// Licensed under the Apache License, Version 2.0 (the "License");
	// you may not use this file except in compliance with the License.
	// You may obtain a copy of the License at
	//
	// https://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing, software
	// distributed under the License is distributed on an "AS IS" BASIS,
	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	// See the License for the specific language governing permissions and
	// limitations under the License.

	#include "cheriot/riscv_cheriot_vector_fp_reduction_instructions.h"

	#include <algorithm>
	#include <cstdint>
	#include <functional>
	#include <vector>

	#include "absl/random/random.h"
	#include "absl/strings/str_cat.h"
	#include "absl/strings/string_view.h"
	#include "absl/types/span.h"
	#include "cheriot/test/riscv_cheriot_vector_fp_test_utilities.h"
	#include "cheriot/test/riscv_cheriot_vector_instructions_test_base.h"
	#include "googlemock/include/gmock/gmock.h"
	#include "mpact/sim/generic/instruction.h"
	#include "riscv//riscv_fp_host.h"
	#include "riscv//riscv_fp_info.h"
	#include "riscv//riscv_fp_state.h"
	#include "riscv//riscv_register.h"

	namespace {

	using Instruction = ::mpact::sim::generic::Instruction;

	// Functions to test.

	using ::mpact::sim::cheriot::Vfredmax;
	using ::mpact::sim::cheriot::Vfredmin;
	using ::mpact::sim::cheriot::Vfredosum;
	using ::mpact::sim::cheriot::Vfwredosum;

	using ::absl::Span;
	using ::mpact::sim::riscv::FPRoundingMode;
	using ::mpact::sim::riscv::RVFpRegister;
	using ::mpact::sim::riscv::ScopedFPStatus;

	// Test fixture for binary fp instructions.
	class RiscVCheriotFPReductionInstructionsTest
	: public RiscVCheriotFPInstructionsTestBase {
	public:
	// Helper function for floating point reduction operations.
	template <typename Vd, typename Vs2, typename Vs1>
	void ReductionOpFPTestHelper(absl::string_view name, int sew,
	Instruction *inst, int delta_position,
	std::function<Vd(Vs1, Vs2)> operation) {
	int byte_sew = sew / 8;
	if (byte_sew != sizeof(Vd) && byte_sew != sizeof(Vs2) &&
	byte_sew != sizeof(Vs1)) {
	FAIL() << name << ": selected element width != any operand types"
	<< "sew: " << sew << " Vd: " << sizeof(Vd)
	<< " Vs2: " << sizeof(Vs2) << " Vs1: " << sizeof(Vs1);
	return;
	}
	// Number of elements per vector register.
	constexpr int vs2_size = kVectorLengthInBytes / sizeof(Vs2);
	constexpr int vs1_size = kVectorLengthInBytes / sizeof(Vs1);
	// Input values for 8 registers.
	Vs2 vs2_value[vs2_size * 8];
	auto vs2_span = Span<Vs2>(vs2_value);
	Vs1 vs1_value[vs1_size * 8];
	auto vs1_span = Span<Vs1>(vs1_value);
	AppendVectorRegisterOperands({kVs2, kVs1, kVmask}, {kVd});
	auto mask_span = Span<const uint8_t>(kA5Mask);
	SetVectorRegisterValues<uint8_t>({{kVmaskName, mask_span}});
	// Iterate across the different lmul values.
	for (int lmul_index = 0; lmul_index < 7; lmul_index++) {
	// Initialize input values.
	FillArrayWithRandomFPValues<Vs2>(vs2_span);
	FillArrayWithRandomFPValues<Vs1>(vs1_span);
	for (int i = 0; i < 8; i++) {
	auto vs2_name = absl::StrCat("v", kVs2 + i);
	auto vs1_name = absl::StrCat("v", kVs1 + i);
	SetVectorRegisterValues<Vs2>(
	{{vs2_name, vs2_span.subspan(vs2_size * i, vs2_size)}});
	SetVectorRegisterValues<Vs1>(
	{{vs1_name, vs1_span.subspan(vs1_size * i, vs1_size)}});
	}
	for (int vlen_count = 0; vlen_count < 4; vlen_count++) {
	int lmul8 = kLmul8Values[lmul_index];
	int lmul8_vs2 = lmul8 * sizeof(Vs2) / byte_sew;
	int lmul8_vs1 = lmul8 * sizeof(Vs1) / byte_sew;
	int lmul8_vd = lmul8 * sizeof(Vd) / byte_sew;
	int num_values = lmul8 * kVectorLengthInBytes / (8 * byte_sew);
	// Set vlen, but leave vlen high at least once.
	int vlen = 1024;
	if (vlen_count > 0) {
	vlen =
	absl::Uniform(absl::IntervalOpenClosed, bitgen_, 0, num_values);
	}
	num_values = std::min(num_values, vlen);
	// Configure vector unit for different lmul settings.
	uint32_t vtype =
	(kSewSettingsByByteSize[byte_sew] << 3) \| kLmulSettings[lmul_index];
	ConfigureVectorUnit(vtype, vlen);

	// Iterate across rounding modes.
	for (int rm : {0, 1, 2, 3, 4}) {
	rv_fp_->SetRoundingMode(static_cast<FPRoundingMode>(rm));

	ClearVectorRegisterGroup(kVd, 8);

	inst->Execute();

	if (lmul8_vd < 1 \|\| lmul8_vd > 64) {
	EXPECT_TRUE(rv_vector_->vector_exception())
	<< "lmul8: vd: " << lmul8_vd;
	rv_vector_->clear_vector_exception();
	continue;
	}

	if (lmul8_vs2 < 1 \|\| lmul8_vs2 > 64) {
	EXPECT_TRUE(rv_vector_->vector_exception())
	<< "lmul8: vs2: " << lmul8_vs2;
	rv_vector_->clear_vector_exception();
	continue;
	}

	if (lmul8_vs1 < 1 \|\| lmul8_vs1 > 64) {
	EXPECT_TRUE(rv_vector_->vector_exception())
	<< "lmul8: vs1: " << lmul8_vs1;
	rv_vector_->clear_vector_exception();
	continue;
	}
	EXPECT_FALSE(rv_vector_->vector_exception());
	// Initialize the accumulator with the value from vs1[0].
	Vd accumulator = static_cast<Vd>(vs1_span[0]);
	ScopedFPStatus set_fpstatus(rv_fp_->host_fp_interface());
	for (int i = 0; i < num_values; i++) {
	int mask_index = i >> 3;
	int mask_offset = i & 0b111;
	bool mask_value = (mask_span[mask_index] >> mask_offset) & 0b1;
	if (mask_value) {
	accumulator = operation(accumulator, vs2_span[i]);
	}
	}
	auto reg_val = vreg_[kVd]->data_buffer()->Get<Vd>(0);
	FPCompare<Vd>(accumulator, reg_val, delta_position, "");
	}
	}
	}
	}
	};

	// Test vector floating point sum reduction.
	TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredosum) {
	SetSemanticFunction(&Vfredosum);
	ReductionOpFPTestHelper<float, float, float>(
	"Vfredosum_32", /sew/ 32, instruction_, /delta_position/ 32,
	[](float val0, float val1) -> float { return val0 + val1; });
	ResetInstruction();
	SetSemanticFunction(&Vfredosum);
	ReductionOpFPTestHelper<double, double, double>(
	"Vfredosum_64", /sew/ 64, instruction_, /delta_position/ 64,
	[](double val0, double val1) -> double { return val0 + val1; });
	}

	// Test vector floating point widening sum reduction.
	TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfwredosum) {
	SetSemanticFunction(&Vfwredosum);
	ReductionOpFPTestHelper<double, float, double>(
	"Vfwredosum_32", /sew/ 32, instruction_, /delta_position/ 64,
	[](double val0, float val1) -> double {
	return val0 + static_cast<double>(val1);
	});
	}

	template <typename T>
	T MaxMinHelper(T vs2, T vs1, std::function<T(T, T)> operation) {
	using UInt = typename FPTypeInfo<T>::IntType;
	UInt vs2_uint = reinterpret_cast<UInt >(&vs2);
	UInt vs1_uint = reinterpret_cast<UInt >(&vs1);
	UInt mask = 1ULL << (FPTypeInfo<T>::kSigSize - 1);
	bool nan_vs2 = std::isnan(vs2);
	bool nan_vs1 = std::isnan(vs1);
	if ((nan_vs2 && ((mask & vs2_uint) == 0)) \|\|
	(nan_vs1 && ((mask & vs1_uint) == 0)) \|\| (nan_vs2 && nan_vs1)) {
	// Canonical NaN.
	UInt canonical = ((1ULL << (FPTypeInfo<T>::kExpSize + 1)) - 1)
	<< (FPTypeInfo<T>::kSigSize - 1);
	T canonical_fp = reinterpret_cast<T >(&canonical);
	return canonical_fp;
	}
	if (nan_vs2) return vs1;
	if (nan_vs1) return vs2;
	return operation(vs2, vs1);
	}

	// Test vector floating point min reduction.
	TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredmin) {
	SetSemanticFunction(&Vfredmin);
	ReductionOpFPTestHelper<float, float, float>(
	"Vfredmin_32", /sew/ 32, instruction_, /delta_position/ 32,
	[](float val0, float val1) -> float {
	return MaxMinHelper<float>(val0, val1,
	[](float val0, float val1) -> float {
	return (val0 > val1) ? val1 : val0;
	});
	});
	ResetInstruction();
	SetSemanticFunction(&Vfredmin);
	ReductionOpFPTestHelper<double, double, double>(
	"Vfredmin_64", /sew/ 64, instruction_, /delta_position/ 64,
	[](double val0, double val1) -> double {
	return MaxMinHelper<double>(val0, val1,
	[](double val0, double val1) -> double {
	return (val0 > val1) ? val1 : val0;
	});
	});
	}

	// Test vector floating point max reduction.
	TEST_F(RiscVCheriotFPReductionInstructionsTest, Vfredmax) {
	SetSemanticFunction(&Vfredmax);
	ReductionOpFPTestHelper<float, float, float>(
	"Vfredmin_32", /sew/ 32, instruction_, /delta_position/ 32,
	[](float val0, float val1) -> float {
	return MaxMinHelper<float>(val0, val1,
	[](float val0, float val1) -> float {
	return (val0 < val1) ? val1 : val0;
	});
	});
	ResetInstruction();
	SetSemanticFunction(&Vfredmax);
	ReductionOpFPTestHelper<double, double, double>(
	"Vfredmin_64", /sew/ 64, instruction_, /delta_position/ 64,
	[](double val0, double val1) -> double {
	return MaxMinHelper<double>(val0, val1,
	[](double val0, double val1) -> double {
	return (val0 < val1) ? val1 : val0;
	});
	});
	}

	} // namespace