frontend/hebench__matmult_8cpp_source.html

 // Copyright (C) 2021 Intel Corporation

 // SPDX-License-Identifier: Apache-2.0


 #include <cassert>

 #include <sstream>

 #include <stdexcept>


 #include "../include/hebench_matmult.h"


 namespace hebench {

 namespace TestHarness {

 namespace MatrixMultiply {


 //------------------------------------

 // class BenchmarkDescriptorCategory

 //------------------------------------


 // Expected type of each workload parameter, indexed by parameter position.
 // fetchMatrixSizes() compares the `data_type` of every incoming workload
 // parameter against the entry at the same index of this table and reads the
 // three values as: rows of the first matrix, columns of the first matrix
 // (also rows of the second matrix), and columns of the second matrix.
 hebench::APIBridge::WorkloadParamType::WorkloadParamType

     BenchmarkDescriptorCategory::WorkloadParameterType[BenchmarkDescriptorCategory::WorkloadParameterCount] = {

         hebench::APIBridge::WorkloadParamType::UInt64,

         hebench::APIBridge::WorkloadParamType::UInt64,

         hebench::APIBridge::WorkloadParamType::UInt64

     };


 // Extracts the (rows, columns) of both operand matrices from the workload
 // parameters.
 //
 // w_params: workload parameters; the first WorkloadParameterCount entries are
 //   validated and used, any additional entries are ignored.
 // Returns: element 0 is (w_params[0], w_params[1]) for the first matrix and
 //   element 1 is (w_params[1], w_params[2]) for the second matrix, so the
 //   shared inner dimension always comes from w_params[1].
 // Throws: std::invalid_argument when there are too few parameters, when a
 //   parameter does not have the type listed in WorkloadParameterType, or when
 //   a matrix size is zero.
 std::array<std::pair<std::uint64_t, std::uint64_t>, BenchmarkDescriptorCategory::OpParameterCount>
 BenchmarkDescriptorCategory::fetchMatrixSizes(const std::vector<hebench::APIBridge::WorkloadParam> &w_params)
 {
     // The indexing below hard-codes the parameter layout; the counts are
     // compile-time constants, so verify them at compile time.
     static_assert(WorkloadParameterCount == 3, "Matrix multiplication expects 3 workload parameters.");
     static_assert(OpParameterCount == 2, "Matrix multiplication expects 2 operands.");
     static_assert(OpResultCount == 1, "Matrix multiplication expects 1 result.");

     if (w_params.size() < WorkloadParameterCount)
     {
         std::stringstream ss;
         ss << "Insufficient workload parameters in 'w_params'. Expected " << WorkloadParameterCount
            << ", but " << w_params.size() << " received.";
         throw std::invalid_argument(IL_LOG_MSG_CLASS(ss.str()));
     } // end if

     // validate workload parameters
     for (std::size_t i = 0; i < WorkloadParameterCount; ++i)
     {
         if (w_params[i].data_type != WorkloadParameterType[i])
         {
             std::stringstream ss;
             ss << "Invalid type for workload parameter " << i
                << ". Expected type ID " << WorkloadParameterType[i] << ", but " << w_params[i].data_type << " received.";
             throw std::invalid_argument(IL_LOG_MSG_CLASS(ss.str()));
         } // end if

         // sizes are unsigned, so zero is the only non-positive value possible
         if (w_params[i].u_param == 0)
         {
             std::stringstream ss;
             ss << "Invalid matrix size in workload parameter " << i
                << ". Expected positive integer, but " << w_params[i].u_param << " received.";
             throw std::invalid_argument(IL_LOG_MSG_CLASS(ss.str()));
         } // end if
     } // end for

     // all indices used here were bounds-checked by the size test above
     std::array<std::pair<std::uint64_t, std::uint64_t>, OpParameterCount> retval;
     retval[0] = std::make_pair(w_params[0].u_param, w_params[1].u_param);
     retval[1] = std::make_pair(w_params[1].u_param, w_params[2].u_param);

     return retval;
 }


 // Fills `output` with the concrete descriptor and the naming data for this
 // workload.
 //
 // output: receives the completed descriptor, the workload name, the base
 //   workload name and the number of operation parameters.
 // engine: not used by this workload.
 // backend_desc: supplies the backend descriptor used as the starting point.
 // config: benchmark configuration; its workload parameters provide the
 //   matrix sizes that appear in the workload name.
 // Exceptions thrown by fetchMatrixSizes() for invalid workload parameters are
 // not caught here.
 void BenchmarkDescriptorCategory::completeWorkloadDescription(WorkloadDescriptionOutput &output,
                                                               const Engine &engine,
                                                               const BenchmarkDescription::Backend &backend_desc,
                                                               const BenchmarkDescription::Configuration &config) const
 {
     (void)engine; // intentionally unused

     // start from the backend's descriptor and let the shared helper complete
     // the category parameters using the configuration
     output.concrete_descriptor = backend_desc.descriptor;
     const bool force_config    = PartialBenchmarkDescriptor::getForceConfigValues();
     PartialBenchmarkDescriptor::completeCategoryParams(output.concrete_descriptor,
                                                        backend_desc.descriptor,
                                                        config,
                                                        force_config);

     // workload name: "<base name> (RxC) x (RxC)"
     const auto operand_dims = fetchMatrixSizes(config.w_params);
     const auto &lhs_dims    = operand_dims[0];
     const auto &rhs_dims    = operand_dims[1];

     std::stringstream name_builder;
     name_builder << BaseWorkloadName << " ("
                  << lhs_dims.first << "x" << lhs_dims.second << ") x ("
                  << rhs_dims.first << "x" << rhs_dims.second << ")";

     output.workload_name          = name_builder.str();
     output.workload_base_name     = BaseWorkloadName;
     output.operation_params_count = BenchmarkDescriptorCategory::OpParameterCount;
 }


 // Tells whether this category can handle the described benchmark.
 //
 // bench_desc: descriptor whose `workload` field is inspected.
 // w_params: workload parameters to validate.
 // Returns: true only when the workload is MatrixMultiply and
 //   fetchMatrixSizes() accepts `w_params`; false otherwise. No exception
 //   raised by the validation escapes this method.
 bool BenchmarkDescriptorCategory::matchBenchmarkDescriptor(const hebench::APIBridge::BenchmarkDescriptor &bench_desc,
                                                            const std::vector<hebench::APIBridge::WorkloadParam> &w_params) const
 {
     // a different workload is never a match
     if (bench_desc.workload != hebench::APIBridge::Workload::MatrixMultiply)
         return false;

     try
     {
         // only the validation matters here; the sizes themselves are discarded
         fetchMatrixSizes(w_params);
     }
     catch (...)
     {
         // any failure while reading the sizes means the workload is not supported
         return false;
     }

     return true;
 }


 //---------------------------

 // class DataGeneratorHelper

 //---------------------------


 // Static helper that produces matrix data: random matrices and matrix
 // products. Matrices are addressed as flat buffers in row-major order.
 class DataGeneratorHelper
 {
 private:
     IL_DECLARE_CLASS_NAME(MatrixMultiply::DataGeneratorHelper)

 public:
     // Fills `mat_result` (rows x cols elements of `data_type`) with random values.
     static void generateRandomMatrixN(hebench::APIBridge::DataType data_type,
                                       void *mat_result, std::uint64_t rows, std::uint64_t cols,
                                       double mean, double stddev);
     // Computes mat_result = mat_a * mat_b, interpreting the buffers as `data_type`.
     static void matMul(hebench::APIBridge::DataType data_type,
                        void *mat_result, const void *mat_a, const void *mat_b,
                        std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b);

 protected:
     DataGeneratorHelper() {}

 private:
     // Typed implementation of the matrix product.
     //
     // mat_a is (rows_a x cols_a), mat_b is (cols_a x cols_b) and mat_result
     // is (rows_a x cols_b). Throws std::invalid_argument if any pointer is
     // null.
     template <class T>
     static void matMul(T *mat_result, const T *mat_a, const T *mat_b,
                        std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b)
     {
         if (mat_result == nullptr)
             throw std::invalid_argument(IL_LOG_MSG_CLASS("Invalid null `mat_result`"));
         if (mat_a == nullptr)
             throw std::invalid_argument(IL_LOG_MSG_CLASS("Invalid null `mat_a`"));
         if (mat_b == nullptr)
             throw std::invalid_argument(IL_LOG_MSG_CLASS("Invalid null `mat_b`"));

         // plain triple loop: every output cell is the dot product of a row
         // of A with a column of B
         for (std::uint64_t i = 0; i < rows_a; ++i)
         {
             const std::uint64_t lhs_row_start = i * cols_a;
             const std::uint64_t out_row_start = i * cols_b;

             for (std::uint64_t j = 0; j < cols_b; ++j)
             {
                 // accumulate directly in the output cell
                 T &cell = mat_result[out_row_start + j];
                 cell    = 0;

                 // k walks the columns of A, which are also the rows of B
                 for (std::uint64_t k = 0; k < cols_a; ++k)
                     cell += mat_a[lhs_row_start + k] * mat_b[k * cols_b + j];
             } // end for
         } // end for
     }
 };


 // Fills a matrix with random values by treating it as a flat vector of
 // rows * cols elements and delegating to the general test harness helper
 // generateRandomVectorN().
 //
 // data_type: element type of the buffer.
 // mat_result: destination buffer, forwarded unchanged.
 // rows, cols: matrix dimensions.
 // mean, stddev: distribution parameters, forwarded unchanged.
 void DataGeneratorHelper::generateRandomMatrixN(APIBridge::DataType data_type,
                                                 void *mat_result, std::uint64_t rows, std::uint64_t cols,
                                                 double mean, double stddev)
 {
     const std::uint64_t elem_count = rows * cols;

     hebench::TestHarness::DataGeneratorHelper::generateRandomVectorN(data_type,
                                                                      mat_result, elem_count,
                                                                      mean, stddev);
 }


 // Type-erased entry point for the matrix product: picks the typed
 // implementation that matches `data_type` and forwards the buffers to it.
 //
 // data_type: element type of all three buffers.
 // mat_result: output buffer, (rows_a x cols_b) elements.
 // mat_a: first operand, (rows_a x cols_a) elements.
 // mat_b: second operand, (cols_a x cols_b) elements.
 // Throws: std::invalid_argument for a data type other than Int32, Int64,
 //   Float32 or Float64, and whatever the typed implementation throws.
 void DataGeneratorHelper::matMul(hebench::APIBridge::DataType data_type,
                                  void *mat_result,
                                  const void *mat_a, const void *mat_b,
                                  uint64_t rows_a, uint64_t cols_a, uint64_t cols_b)
 {
     switch (data_type)
     {
     case hebench::APIBridge::DataType::Int32:
         matMul<std::int32_t>(static_cast<std::int32_t *>(mat_result),
                              static_cast<const std::int32_t *>(mat_a),
                              static_cast<const std::int32_t *>(mat_b),
                              rows_a, cols_a, cols_b);
         return;

     case hebench::APIBridge::DataType::Int64:
         matMul<std::int64_t>(static_cast<std::int64_t *>(mat_result),
                              static_cast<const std::int64_t *>(mat_a),
                              static_cast<const std::int64_t *>(mat_b),
                              rows_a, cols_a, cols_b);
         return;

     case hebench::APIBridge::DataType::Float32:
         matMul<float>(static_cast<float *>(mat_result),
                       static_cast<const float *>(mat_a),
                       static_cast<const float *>(mat_b),
                       rows_a, cols_a, cols_b);
         return;

     case hebench::APIBridge::DataType::Float64:
         matMul<double>(static_cast<double *>(mat_result),
                        static_cast<const double *>(mat_a),
                        static_cast<const double *>(mat_b),
                        rows_a, cols_a, cols_b);
         return;

     default:
         throw std::invalid_argument(IL_LOG_MSG_CLASS("Unknown data type."));
     } // end switch
 }


 //------------------

 // class DataLoader

 //------------------


 // Factory for a loader whose data is generated rather than read from a file.
 //
 // rows_a, cols_a, cols_b: dimensions of the operands; the first matrix is
 //   (rows_a x cols_a) and the second is (cols_a x cols_b).
 // batch_size_mat_a, batch_size_mat_b: number of samples for each operand.
 // data_type: element type of the matrices.
 // Returns: shared pointer to the initialized loader. Exceptions thrown by
 //   init() propagate to the caller.
 DataLoader::Ptr DataLoader::create(std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b,
                                    std::uint64_t batch_size_mat_a,
                                    std::uint64_t batch_size_mat_b,
                                    hebench::APIBridge::DataType data_type)
 {
     // two-step construction: build the empty object, then initialize it
     DataLoader::Ptr p_loader(new DataLoader());
     p_loader->init(rows_a, cols_a, cols_b,
                    batch_size_mat_a, batch_size_mat_b,
                    data_type);
     return p_loader;
 }


 // Factory for a loader whose data comes from a dataset file.
 //
 // rows_a, cols_a, cols_b: dimensions of the operands; the first matrix is
 //   (rows_a x cols_a) and the second is (cols_a x cols_b).
 // expected_sample_size_mat_a, expected_sample_size_mat_b: sample counts for
 //   each operand, forwarded to init().
 // data_type: element type of the matrices.
 // dataset_filename: file to load the data from.
 // Returns: shared pointer to the initialized loader. Exceptions thrown by
 //   init() propagate to the caller.
 DataLoader::Ptr DataLoader::create(std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b,
                                    std::uint64_t expected_sample_size_mat_a,
                                    std::uint64_t expected_sample_size_mat_b,
                                    hebench::APIBridge::DataType data_type,
                                    const std::string &dataset_filename)
 {
     // two-step construction: build the empty object, then initialize it
     DataLoader::Ptr p_loader(new DataLoader());
     p_loader->init(rows_a, cols_a, cols_b,
                    expected_sample_size_mat_a, expected_sample_size_mat_b,
                    data_type,
                    dataset_filename);
     return p_loader;
 }


 // Builds an empty loader with all matrix dimensions set to zero. The
 // dimensions receive their real values in init(), which the create()
 // factories call right after construction.
 DataLoader::DataLoader() :

     m_rows_a(0), m_cols_a(0), m_cols_b(0)

 {

 }


 void DataLoader::init(std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b,

                       std::uint64_t batch_size_mat_a,

                       std::uint64_t batch_size_mat_b,

                       hebench::APIBridge::DataType data_type)

 {

     // Load/generate and initialize the data for matrix multiplication:

     // M2 = M0 * M1


     // number of samples in each input parameter and output

     std::size_t batch_sizes[InputDim0 + OutputDim0] = {

         batch_size_mat_a,

         batch_size_mat_b,

         batch_size_mat_a * batch_size_mat_b

     };


     // store the dimensions of each matrix

     std::pair<std::uint64_t, std::uint64_t> mat_dims[InputDim0 + OutputDim0]; // rows <=> first, cols <=> second

     mat_dims[0] = std::make_pair(rows_a, cols_a);

     mat_dims[1] = std::make_pair(cols_a, cols_b);

     mat_dims[2] = std::make_pair(rows_a, cols_b);


     m_rows_a = rows_a;

     m_cols_a = cols_a;

     m_cols_b = cols_b;


     // compute number of elements in vector to hold each matrix data

     // matrices are kept in a single vector in row major order

     std::uint64_t sample_vector_sizes[InputDim0 + OutputDim0];

     for (std::size_t i = 0; i < InputDim0 + OutputDim0; ++i)

     {

         sample_vector_sizes[i] = mat_dims[i].first * mat_dims[i].second;

     } // end for


     // initialize data packs and allocate memory

     PartialDataLoader::init(data_type,

                             InputDim0, batch_sizes, sample_vector_sizes,

                             OutputDim0, sample_vector_sizes + InputDim0,

                             true);


     // at this point all NativeDataBuffers have been allocated and pointed to the correct locations


     // fill up the matrices data


     // input

     for (std::size_t mat_i = 0; mat_i < InputDim0; ++mat_i)

     {

         for (std::uint64_t i = 0; i < batch_sizes[mat_i]; ++i)

         {

             // generate the data

             DataGeneratorHelper::generateRandomMatrixN(data_type,

                                                        getParameterData(mat_i).p_buffers[i].p,

                                                        mat_dims[mat_i].first, // rows

                                                        mat_dims[mat_i].second, // columns

                                                        0.0, 10.0);

         } // end for

     } // end for


     // output

     //#pragma omp parallel for collapse(2)

     for (std::uint64_t m0_i = 0; m0_i < batch_sizes[0]; ++m0_i)

     {

         for (std::uint64_t m1_i = 0; m1_i < batch_sizes[1]; ++m1_i)

         {

             // find the index for the result buffer based on the input indices

             std::uint64_t ppi[] = { m0_i, m1_i };

             std::uint64_t r_i   = getResultIndex(ppi);


             // generate the data

             DataGeneratorHelper::matMul(data_type,

                                         getResultData(0).p_buffers[r_i].p,

                                         getParameterData(0).p_buffers[m0_i].p,

                                         getParameterData(1).p_buffers[m1_i].p,

                                         mat_dims[0].first, mat_dims[0].second, // dims for m0

                                         mat_dims[1].second); // dims for m1

         } // end for

     } // end for


     // all data has been generated at this point

 }


 void DataLoader::init(std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b,

                       std::uint64_t max_sample_size_mat_a,

                       std::uint64_t max_sample_size_mat_b,

                       hebench::APIBridge::DataType data_type,

                       const std::string &dataset_filename)

 {

     // Load/generate and initialize the data for matrix multiplication:

     // M2 = M0 * M1


     // number of samples in each input parameter and output

     std::size_t max_sample_sizes[InputDim0 + OutputDim0] = {

         max_sample_size_mat_a,

         max_sample_size_mat_b,

         max_sample_size_mat_a * max_sample_size_mat_b

     };


     // store the dimensions of each matrix

     std::pair<std::uint64_t, std::uint64_t> mat_dims[InputDim0 + OutputDim0]; // rows <=> first, cols <=> second

     mat_dims[0] = std::make_pair(rows_a, cols_a);

     mat_dims[1] = std::make_pair(cols_a, cols_b);

     mat_dims[2] = std::make_pair(rows_a, cols_b);


     m_rows_a = rows_a;

     m_cols_a = cols_a;

     m_cols_b = cols_b;


     // compute number of elements in vector to hold each matrix data

     // matrices are kept in a single vector in row major order

     std::uint64_t sample_vector_sizes[InputDim0 + OutputDim0];

     for (std::size_t i = 0; i < InputDim0 + OutputDim0; ++i)

     {

         sample_vector_sizes[i] = mat_dims[i].first * mat_dims[i].second;

     } // end for


     PartialDataLoader::init(dataset_filename, data_type,

                             InputDim0, max_sample_sizes, sample_vector_sizes,

                             OutputDim0, sample_vector_sizes + InputDim0);


     // at this point all NativeDataBuffers have been allocated, pointed to the correct locations

     // and buffers loaded with data from dataset_filename

 }


 // Computes the matrix product for one combination of input samples.
 //
 // result: the product is written into the buffer of its first element.
 // param_data_pack_indices: element 0 selects the sample of the first
 //   operand, element 1 the sample of the second operand.
 // data_type: element type of the matrices.
 // No argument validation is done here: callers are expected to pass valid
 // parameters.
 void DataLoader::computeResult(std::vector<hebench::APIBridge::NativeDataBuffer *> &result,
                                const std::uint64_t *param_data_pack_indices,
                                hebench::APIBridge::DataType data_type)
 {
     void *p_product   = result.front()->p;
     const void *p_lhs = this->getParameterData(0).p_buffers[param_data_pack_indices[0]].p;
     const void *p_rhs = this->getParameterData(1).p_buffers[param_data_pack_indices[1]].p;

     // dimensions were stored by init()
     DataGeneratorHelper::matMul(data_type,
                                 p_product, p_lhs, p_rhs,
                                 m_rows_a, m_cols_a, // dims for the first operand
                                 m_cols_b); // columns of the second operand
 }


 } // namespace MatrixMultiply

 } // namespace TestHarness

 } // namespace hebench

hebench::TestHarness::BenchmarkDescription::Backend
Definition: hebench_benchmark_description.h:27

hebench::TestHarness::BenchmarkDescription::Backend::descriptor
const hebench::APIBridge::BenchmarkDescriptor & descriptor
Benchmark backend descriptor, as retrieved by backend, corresponding to the registration handle h_des...
Definition: hebench_benchmark_description.h:53

hebench::TestHarness::BenchmarkDescription::Configuration
Specifies a benchmark configuration.
Definition: hebench_benchmark_description.h:107

hebench::TestHarness::BenchmarkDescription::Configuration::w_params
std::vector< hebench::APIBridge::WorkloadParam > w_params
Set of arguments for workload parameters.
Definition: hebench_benchmark_description.h:151

hebench::TestHarness::DataGeneratorHelper::generateRandomVectorN
static void generateRandomVectorN(hebench::APIBridge::DataType data_type, void *result, std::uint64_t elem_count, double mean, double stddev)
Generates normally distributed random data of the specified type.
Definition: datagen_helper.cpp:123

hebench::TestHarness::Engine
Definition: hebench_engine.h:23

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::fetchMatrixSizes
static std::array< std::pair< std::uint64_t, std::uint64_t >, OpParameterCount > fetchMatrixSizes(const std::vector< hebench::APIBridge::WorkloadParam > &w_params)
fetchMatrixSizes
Definition: hebench_matmult.cpp:27

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::matchBenchmarkDescriptor
bool matchBenchmarkDescriptor(const hebench::APIBridge::BenchmarkDescriptor &bench_desc, const std::vector< hebench::APIBridge::WorkloadParam > &w_params) const override
Determines if the represented benchmark can perform the workload described by a specified HEBench ben...
Definition: hebench_matmult.cpp:92

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::BaseWorkloadName
static constexpr const char * BaseWorkloadName
Definition: hebench_matmult.h:34

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::WorkloadParameterCount
static constexpr std::uint64_t WorkloadParameterCount
Definition: hebench_matmult.h:35

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::OpParameterCount
static constexpr std::uint64_t OpParameterCount
Definition: hebench_matmult.h:36

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::completeWorkloadDescription
void completeWorkloadDescription(WorkloadDescriptionOutput &output, const Engine &engine, const BenchmarkDescription::Backend &backend_desc, const BenchmarkDescription::Configuration &config) const override
Completes the description for the matched benchmark.
Definition: hebench_matmult.cpp:66

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::WorkloadParameterType
static hebench::APIBridge::WorkloadParamType::WorkloadParamType WorkloadParameterType[WorkloadParameterCount]
Definition: hebench_matmult.h:38

hebench::TestHarness::MatrixMultiply::BenchmarkDescriptorCategory::OpResultCount
static constexpr std::uint64_t OpResultCount
Definition: hebench_matmult.h:37

hebench::TestHarness::MatrixMultiply::DataGeneratorHelper
Static helper class to generate matrix data for all supported data types.
Definition: hebench_matmult.cpp:123

hebench::TestHarness::MatrixMultiply::DataGeneratorHelper::generateRandomMatrixN
static void generateRandomMatrixN(hebench::APIBridge::DataType data_type, void *mat_result, std::uint64_t rows, std::uint64_t cols, double mean, double stddev)
Definition: hebench_matmult.cpp:164

hebench::TestHarness::MatrixMultiply::DataGeneratorHelper::DataGeneratorHelper
DataGeneratorHelper()
Definition: hebench_matmult.cpp:136

hebench::TestHarness::MatrixMultiply::DataGeneratorHelper::matMul
static void matMul(hebench::APIBridge::DataType data_type, void *mat_result, const void *mat_a, const void *mat_b, std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b)

hebench::TestHarness::MatrixMultiply::DataLoader
Definition: hebench_matmult.h:63

hebench::TestHarness::MatrixMultiply::DataLoader::create
static DataLoader::Ptr create(std::uint64_t rows_a, std::uint64_t cols_a, std::uint64_t cols_b, std::uint64_t batch_size_mat_a, std::uint64_t batch_size_mat_b, hebench::APIBridge::DataType data_type)
Definition: hebench_matmult.cpp:214

hebench::TestHarness::MatrixMultiply::DataLoader::computeResult
void computeResult(std::vector< hebench::APIBridge::NativeDataBuffer * > &result, const std::uint64_t *param_data_pack_indices, hebench::APIBridge::DataType data_type) override
Computes result of the operation on the input data given the indices of the input sample.
Definition: hebench_matmult.cpp:365

hebench::TestHarness::MatrixMultiply::DataLoader::Ptr
std::shared_ptr< DataLoader > Ptr
Definition: hebench_matmult.h:71

hebench::TestHarness::PartialBenchmarkDescriptor::completeCategoryParams
static void completeCategoryParams(hebench::APIBridge::BenchmarkDescriptor &out_descriptor, const hebench::APIBridge::BenchmarkDescriptor &in_descriptor, const BenchmarkDescription::Configuration &config, bool force_config)
Completes common elements of category parameters in a descriptor using the specified configuration.
Definition: hebench_ibenchmark.cpp:193

hebench::TestHarness::PartialBenchmarkDescriptor::getForceConfigValues
static bool getForceConfigValues()
Specifies whether frontend will override backend descriptors using configuration data or not.
Definition: hebench_ibenchmark.h:205

hebench::TestHarness::PartialBenchmarkDescriptor::WorkloadDescriptionOutput::operation_params_count
std::size_t operation_params_count
Number of parameters for the represented workload operation.
Definition: hebench_ibenchmark.h:298

hebench::TestHarness::PartialBenchmarkDescriptor::WorkloadDescriptionOutput::workload_name
std::string workload_name
Human-readable friendly name for the represented workload to be used for its description on the repor...
Definition: hebench_ibenchmark.h:312

hebench::TestHarness::PartialBenchmarkDescriptor::WorkloadDescriptionOutput::concrete_descriptor
hebench::APIBridge::BenchmarkDescriptor concrete_descriptor
Benchmark descriptor completed with concrete values assigned to configurable fields.
Definition: hebench_ibenchmark.h:302

hebench::TestHarness::PartialBenchmarkDescriptor::WorkloadDescriptionOutput::workload_base_name
std::string workload_base_name
Human-readable friendly name for the represented workload to be used for its description on the repor...
Definition: hebench_ibenchmark.h:307

hebench::TestHarness::PartialBenchmarkDescriptor::WorkloadDescriptionOutput
Bundles values that need to be filled by a workload during completeWorkloadDescription().
Definition: hebench_ibenchmark.h:294

hebench::TestHarness::PartialDataLoader::getResultData
const hebench::APIBridge::DataPack & getResultData(std::uint64_t param_position) const override
Data pack corresponding to the specified component of the result.
Definition: hebench_idata_loader.cpp:654

hebench::TestHarness::PartialDataLoader::getParameterData
const hebench::APIBridge::DataPack & getParameterData(std::uint64_t param_position) const override
Data pack for specified operation parameter (operand).
Definition: hebench_idata_loader.cpp:643

hebench::TestHarness::PartialDataLoader::init
void init(hebench::APIBridge::DataType data_type, std::size_t input_dim, const std::size_t *input_sample_count_per_dim, const std::uint64_t *input_count_per_dim, std::size_t output_dim, const std::uint64_t *output_count_per_dim, bool allocate_output)
Initializes dimensions of inputs and outputs. No allocation is performed.
Definition: hebench_idata_loader.cpp:388

hebench::TestHarness::PartialDataLoader::getResultIndex
std::uint64_t getResultIndex(const std::uint64_t *param_data_pack_indices) const override
Computes the index of the result NativeDataBuffer given the indices of the input data.
Definition: hebench_idata_loader.cpp:693

hebench::APIBridge::WorkloadParamType::WorkloadParamType
WorkloadParamType
Defines the possible data types for a workload flexible parameter.
Definition: types.h:303

hebench::APIBridge::WorkloadParamType::Float64
@ Float64
64 bits IEEE 754 standard floating point real numbers.
Definition: types.h:306

hebench::APIBridge::WorkloadParamType::Int64
@ Int64
64 bits signed integers.
Definition: types.h:304

hebench::APIBridge::WorkloadParamType::UInt64
@ UInt64
64 bits unsigned integers.
Definition: types.h:305

hebench::APIBridge::DataType
DataType
Defines data types for a workload.
Definition: types.h:379

hebench::APIBridge::Float32
@ Float32
32 bits IEEE 754 standard floating point real numbers.
Definition: types.h:382

hebench::APIBridge::Int32
@ Int32
32 bits signed integers.
Definition: types.h:380

hebench::APIBridge::BenchmarkDescriptor::workload
Workload workload
Workload for the benchmark.
Definition: types.h:529

hebench::APIBridge::MatrixMultiply
@ MatrixMultiply
Definition: types.h:104

hebench::APIBridge::BenchmarkDescriptor
Defines a benchmark test.
Definition: types.h:527

hebench
Definition: hebench_benchmark_category.h:18