Added code to report the average tuning results

pull/304/head
Cedric Nugteren 2018-07-23 21:00:10 +02:00
parent f8fb707fa4
commit 6a8b9e24f2
2 changed files with 14 additions and 1 deletions

View File

@@ -1,4 +1,8 @@
Development (next version)
- Added support for shuffle instructions for NVIDIA GPUs (thanks to 'tyler-utah')
- Various minor fixes and enhancements
Version 1.4.1
- Fixed an access violation under Windows upon releasing the OpenCL program when the driver is already unloaded
- Fixed an issue with double cl_program release in the CLBlast caching system

View File

@@ -342,8 +342,17 @@ void Tuner(int argc, char* argv[], const int V,
const auto best_time_ms = best_configuration->score;
if (best_time_ms == 0.0) { return; }
// Also prints the performance of the best-case in terms of GB/s or GFLOPS
// Computes and prints some other statistics
auto average_ms = 0.0;
for (const auto result : results) { average_ms += result.score; }
average_ms /= results.size();
printf("\n");
printf("* Got average result of %.2lf ms", average_ms);
printf(": %.1lf %s\n", settings.metric_amount / (average_ms * 1.0e6),
settings.performance_unit.c_str());
// Also prints the performance of the best-case in terms of GB/s or GFLOPS
printf("* Found best result %.2lf ms", best_time_ms);
printf(": %.1lf %s\n", settings.metric_amount / (best_time_ms * 1.0e6),
settings.performance_unit.c_str());