mirror of
https://github.com/CNugteren/CLBlast.git
synced 2024-07-07 12:23:46 +02:00
Fixed an issue with computing the GFLOPS numbers for the xGEMM performance tests for non-square matrices
This commit is contained in:
parent
ed2904a344
commit
1acb31896c
|
@@ -153,10 +153,10 @@ class TestXgemm {
|
|||
|
||||
// Describes how to compute performance metrics
|
||||
static size_t GetFlops(const Arguments<T> &args) {
|
||||
- return 2 * args.m * args.n * args.m;
|
||||
+ return 2 * args.m * args.n * args.k;
|
||||
}
|
||||
static size_t GetBytes(const Arguments<T> &args) {
|
||||
- return (args.m*args.m + args.m*args.n + 2*args.m*args.n) * sizeof(T);
|
||||
+ return (args.m*args.k + args.k*args.n + 2*args.m*args.n) * sizeof(T);
|
||||
}
|
||||
};
|
||||
|
||||
|
|
Loading…
Reference in a new issue