// Non-template entry point: forwards run_imp_settings and data_type_size,
// unchanged, to the overload of RunEvalImpMultDataSets that is templated on a
// run_environment::AccSetting value, and returns that overload's MultRunData.
// NOTE(review): this listing omits the lines between the numbered ones, so the
// run_imp_settings parameter declaration and the conditions that decide which
// of the returns below executes are not visible here -- confirm against the
// full source before relying on the order of the returns.
30 MultRunData RunImpMultInputsBp::RunEvalImpMultDataSets(
32 size_t data_type_size)
const
// Each return instantiates the templated overload with a different
// acceleration setting: kCUDA, kAVX512, kAVX512_F16, kAVX256, kAVX256_F16,
// kNEON, and finally kNone.
35 return RunEvalImpMultDataSets<run_environment::AccSetting::kCUDA>(run_imp_settings, data_type_size);
38 return RunEvalImpMultDataSets<run_environment::AccSetting::kAVX512>(run_imp_settings, data_type_size);
41 return RunEvalImpMultDataSets<run_environment::AccSetting::kAVX512_F16>(run_imp_settings, data_type_size);
44 return RunEvalImpMultDataSets<run_environment::AccSetting::kAVX256>(run_imp_settings, data_type_size);
47 return RunEvalImpMultDataSets<run_environment::AccSetting::kAVX256_F16>(run_imp_settings, data_type_size);
50 return RunEvalImpMultDataSets<run_environment::AccSetting::kNEON>(run_imp_settings, data_type_size);
// NOTE(review): kNone is the last return; presumably the fallback when no
// accelerated setting applies -- the guarding condition is not shown.
53 return RunEvalImpMultDataSets<run_environment::AccSetting::kNone>(run_imp_settings, data_type_size);
// Overload templated on the acceleration setting OPT_IMP_ACCEL: picks the
// element type from data_type_size and forwards run_imp_settings to the
// overload templated on <type, OPT_IMP_ACCEL>, returning its MultRunData.
// NOTE(review): lines between the numbered ones (closing braces, the final
// else, and the #else/#endif of the preprocessor blocks) are missing from this
// listing, so the exact nesting of the half-precision branches is not visible.
56 template <run_environment::AccSetting OPT_IMP_ACCEL>
57 MultRunData RunImpMultInputsBp::RunEvalImpMultDataSets(
59 size_t data_type_size)
const
// Size matches float: run the float instantiation.
61 if (data_type_size ==
sizeof(
float)) {
62 return RunEvalImpMultDataSets<float, OPT_IMP_ACCEL>(run_imp_settings);
// Size matches double: run the double instantiation.
64 else if (data_type_size ==
sizeof(
double)) {
65 return RunEvalImpMultDataSets<double, OPT_IMP_ACCEL>(run_imp_settings);
// Remaining returns select a type for the case that is neither float nor
// double; which one is compiled depends on the preprocessor symbols below.
// Optimized CPU build that is not targeting ARM: short is the element type.
71 #if (defined(OPTIMIZED_CPU_RUN) && (!(defined(COMPILING_FOR_ARM))))
75 return RunEvalImpMultDataSets<short, OPT_IMP_ACCEL>(run_imp_settings);
// With FLOAT16_VECTORIZATION defined: print a notice to stdout (std::endl also
// flushes the stream) and use _Float16 as the element type.
77 #if defined(FLOAT16_VECTORIZATION)
82 std::cout <<
"FLOAT16 USED" << std::endl;
83 return RunEvalImpMultDataSets<_Float16, OPT_IMP_ACCEL>(run_imp_settings);
// NOTE(review): halftype is declared elsewhere; presumably the half-precision
// type used when neither preprocessor branch above applies -- confirm.
87 return RunEvalImpMultDataSets<halftype, OPT_IMP_ACCEL>(run_imp_settings);
// Overload templated on element type T (constrained by RunData_t) and
// acceleration setting OPT_IMP_ACCEL: gathers one MultRunData per run into
// run_results, folds them into run_data_all_runs, and returns the combined
// result.
// NOTE(review): the parameter list, the declaration of run_data_all_runs, and
// the code that fills run_results are on lines missing from this listing.
92 template <RunData_t T, run_environment::AccSetting OPT_IMP_ACCEL>
93 MultRunData RunImpMultInputsBp::RunEvalImpMultDataSets(
// Results of the individual runs, combined further below.
97 std::vector<MultRunData> run_results;
// Code following this directive is compiled only when SMALLER_SETS_ONLY is not
// defined; its contents are not visible here.
103 #ifndef SMALLER_SETS_ONLY
// Fold every per-run result into the combined result. run_result is taken by
// non-const reference because merge may modify its argument.
// NOTE(review): MultRunData is described in this listing as a std::map alias,
// so this is presumably std::map::merge, which leaves entries whose key already
// exists in the destination behind in run_result -- confirm that is intended.
110 for (
auto& run_result : run_results) {
111 run_data_all_runs.merge(run_result);
114 return run_data_all_runs;
std::map< InputSignature, std::optional< std::map< run_environment::ParallelParamsSetting, RunData > >> MultRunData
Alias mapping input signature to run data for each parallel parameters setting. Run data is null if r...
Structure that stores settings for current implementation run.