Increased the default number of runs for the tuner from 2 up to 10 for fast kernels
parent
192199c9cb
commit
3eea8dc998
|
@@ -48,7 +48,7 @@ class TuneCopy {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &) { return 1; } // N/A for this kernel
|
||||
|
|
|
@@ -48,7 +48,7 @@ class TunePad {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &) { return 1; } // N/A for this kernel
|
||||
|
|
|
@@ -48,7 +48,7 @@ class TuneTranspose {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &) { return 1; } // N/A for this kernel
|
||||
|
|
|
@@ -48,7 +48,7 @@ class TunePadTranspose {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &) { return 1; } // N/A for this kernel
|
||||
|
|
|
@@ -48,7 +48,7 @@ class TuneXdot {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &args) { return args.n; }
|
||||
|
|
|
@@ -193,7 +193,7 @@ void StartVariation(int argc, char *argv[]) {
|
|||
// Main function (not within the clblast namespace)
|
||||
int main(int argc, char *argv[]) {
|
||||
StartVariation<1>(argc, argv);
|
||||
StartVariation<2>(argc, argv);
|
||||
//StartVariation<2>(argc, argv);
|
||||
return 0;
|
||||
}
|
||||
|
||||
|
|
|
@@ -48,7 +48,7 @@ class TuneXger {
|
|||
static size_t DefaultK() { return 1; } // N/A for this kernel
|
||||
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
|
||||
static double DefaultFraction() { return 1.0; } // N/A for this kernel
|
||||
static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
|
||||
static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
|
||||
|
||||
// Describes how to obtain the sizes of the buffers
|
||||
static size_t GetSizeX(const Arguments<T> &args) { return args.m; }
|
||||
|
|
Loading…
Reference in New Issue