HEBench
hebench_matmult_l.cpp
// Copyright (C) 2021 Intel Corporation
// SPDX-License-Identifier: Apache-2.0

#include <array>
#include <bitset>
#include <cassert>
#include <cstring>
#include <iomanip>
#include <iostream>
#include <sstream>
#include <stdexcept>
#include <utility>

#include "hebench/modules/logging/include/logging.h"
#include "hebench/modules/timer/include/timer.h"

#include "hebench/api_bridge/api.h"
#include "hebench/modules/general/include/hebench_math_utils.h"
#include "include/hebench_engine.h"

#include "../include/hebench_matmult_l.h"

namespace hebench {
namespace TestHarness {
namespace MatrixMultiply {
namespace Latency {

//----------------------------
// class BenchmarkDescriptor
//----------------------------

bool BenchmarkDescriptor::m_b_registered = // register the benchmark with the factory
    hebench::TestHarness::BenchmarkFactory::registerSupportedBenchmark(std::make_shared<BenchmarkDescriptor>());

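// Determines whether this descriptor can serve a benchmark request: the request
// must match the base matrix multiplication workload and ask for the latency
// category.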
bool BenchmarkDescriptor::matchBenchmarkDescriptor(const hebench::APIBridge::BenchmarkDescriptor &bench_desc,
                                                   const std::vector<hebench::APIBridge::WorkloadParam> &w_params) const
{
    assert(m_b_registered);

    // return true if benchmark is supported

    bool retval =
        BenchmarkDescriptorCategory::matchBenchmarkDescriptor(bench_desc, w_params)
        && (bench_desc.category == hebench::APIBridge::Category::Latency);

    return retval;
}

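// Completes the report header with workload-specific rows: dimensions and batch
// size for each operand (M0, M1) and for the result (M = M0 x M1). As an
// illustration, with hypothetical 10x20 and 20x30 operands and the default batch
// size of 1, the appended CSV fragment would read:
//
//   , , M = M0 x M1
//   , , , Rows, Columns, Batch size
//   , , M0, 10, 20, 1
//   , , M1, 20, 30, 1
//   , , M, 10, 30, 1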
void BenchmarkDescriptor::completeWorkloadDescription(WorkloadDescriptionOutput &output,
                                                      const Engine &engine,
                                                      const BenchmarkDescription::Backend &backend_desc,
                                                      const BenchmarkDescription::Configuration &config) const
{
    assert(OpParameterCount == 2);
    assert(DefaultBatchSize == 1);

    BenchmarkDescriptorCategory::completeWorkloadDescription(output, engine, backend_desc, config);

    assert(OpParameterCount == output.operation_params_count);

    // finish benchmark header description

    std::stringstream ss;
    std::uint64_t batch_sizes[OpParameterCount];
    std::array<std::pair<std::uint64_t, std::uint64_t>, OpParameterCount> mat_dims =
        fetchMatrixSizes(config.w_params);

    ss = std::stringstream();

    std::uint64_t result_batch_size = 1;
    for (std::size_t param_i = 0; param_i < OpParameterCount; ++param_i)
    {
        batch_sizes[param_i] = DefaultBatchSize;
        result_batch_size *= batch_sizes[param_i];
    } // end for
    // complete header with workload specifics
    ss << ", , M = M0 x M1" << std::endl
       << ", , , Rows, Columns, Batch size" << std::endl;
    for (std::size_t i = 0; i < OpParameterCount; ++i)
    {
        ss << ", , M" << i << ", " << mat_dims[i].first << ", " << mat_dims[i].second << ", " << batch_sizes[i] << std::endl;
    } // end for
    ss << ", , M, " << mat_dims[0].first << ", " << mat_dims[1].second << ", " << result_batch_size << std::endl;

    output.workload_header = ss.str();
}

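// Instantiates the Benchmark object represented by this descriptor. The raw
// pointer returned is owned by the caller and must be released through
// destroyBenchmark().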
hebench::TestHarness::PartialBenchmark *BenchmarkDescriptor::createBenchmark(std::shared_ptr<Engine> p_engine,
                                                                             const DescriptionToken &description_token)
{
    assert(m_b_registered);
    Benchmark *retval = nullptr;

    try
    {
        retval = new Benchmark(p_engine, description_token);
    }
    catch (...)
    {
        if (retval)
            delete retval;
        throw;
    }

    return retval;
}

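// Releases a benchmark instance previously returned by createBenchmark().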
void BenchmarkDescriptor::destroyBenchmark(hebench::TestHarness::PartialBenchmark *p_bench)
{
    assert(m_b_registered);
    if (p_bench)
        delete p_bench;
}

//-----------------
// class Benchmark
//-----------------

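// The constructor simply forwards its arguments to the BenchmarkLatency base
// class; workload data is prepared later, in init().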
Benchmark::Benchmark(std::shared_ptr<Engine> p_engine,
                     const IBenchmarkDescriptor::DescriptionToken &description_token) :
    BenchmarkLatency(p_engine, description_token)
{
}

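// Prepares the workload data. Matrix dimensions are read from the workload
// parameters; the inputs and ground truth are either generated randomly or
// loaded from the dataset file named in the benchmark configuration. Preparation
// is timed and the elapsed wall/CPU time is reported on the console.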
void Benchmark::init()
{
    hebench::Common::EventTimer timer;
    hebench::Common::TimingReportEvent::Ptr p_timing_event;
    std::uint64_t batch_sizes[BenchmarkDescriptor::OpParameterCount];
    std::stringstream ss;

    std::array<std::pair<std::uint64_t, std::uint64_t>, BenchmarkDescriptor::OpParameterCount> mat_dims =
        BenchmarkDescriptor::fetchMatrixSizes(this->getBenchmarkConfiguration().w_params);

    for (std::size_t param_i = 0; param_i < BenchmarkDescriptor::OpParameterCount; ++param_i)
        batch_sizes[param_i] = BenchmarkDescriptor::DefaultBatchSize;

    std::cout << IOS_MSG_INFO << hebench::Logging::GlobalLogger::log("Preparing workload.") << std::endl;

    timer.start();
    if (this->getBenchmarkConfiguration().dataset_filename.empty())
    {
        // generate random matrices for the inputs and compute the ground truth
        std::cout << IOS_MSG_INFO << hebench::Logging::GlobalLogger::log("Generating data...") << std::endl;
        m_data = DataLoader::create(mat_dims[0].first, mat_dims[0].second, // M0
                                    mat_dims[1].second, // M1
                                    batch_sizes[0], batch_sizes[1],
                                    this->getBackendDescription().descriptor.data_type);
    } // end if
    else
    {
        std::stringstream ss;
        ss << "Loading data from external dataset: " << std::endl
           << "\"" << this->getBenchmarkConfiguration().dataset_filename << "\"";
        std::cout << IOS_MSG_INFO << hebench::Logging::GlobalLogger::log(ss.str()) << std::endl;
        // load input matrices and ground truth from file
        m_data = DataLoader::create(mat_dims[0].first, mat_dims[0].second, // M0
                                    mat_dims[1].second, // M1
                                    batch_sizes[0], batch_sizes[1],
                                    this->getBackendDescription().descriptor.data_type,
                                    this->getBenchmarkConfiguration().dataset_filename);
    } // end else
    p_timing_event = timer.stop<std::milli>();

    ss = std::stringstream();
    ss << "Total data loaded: " << m_data->getTotalDataLoaded() << " bytes";
    std::cout << IOS_MSG_DONE << hebench::Logging::GlobalLogger::log(ss.str()) << std::endl;
    ss = std::stringstream();
    ss << "Elapsed wall time: " << p_timing_event->elapsedWallTime<std::milli>() << " ms";
    std::cout << IOS_MSG_INFO << hebench::Logging::GlobalLogger::log(ss.str()) << std::endl;
    ss = std::stringstream();
    ss << "Elapsed CPU time: " << p_timing_event->elapsedCPUTime<std::milli>() << " ms";
    std::cout << IOS_MSG_INFO << hebench::Logging::GlobalLogger::log(ss.str()) << std::endl;
}

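// Checks that the dataset shape matches this workload (two operands, one result)
// and then delegates validation against the ground truth to the latency category
// base class.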
bool Benchmark::validateResult(IDataLoader::Ptr dataset,
                               const std::uint64_t *param_data_pack_indices,
                               const std::vector<hebench::APIBridge::NativeDataBuffer *> &outputs,
                               hebench::APIBridge::DataType data_type) const
{
    assert(dataset->getParameterCount() == BenchmarkDescriptorCategory::OpParameterCount
           && dataset->getResultCount() == BenchmarkDescriptorCategory::OpResultCount);

    return BenchmarkLatency::validateResult(dataset, param_data_pack_indices, outputs, data_type);
}

} // namespace Latency
} // namespace MatrixMultiply
} // namespace TestHarness
} // namespace hebench