mirror of
https://github.com/CNugteren/CLBlast.git
synced 2024-07-04 21:36:57 +02:00
Merge pull request #368 from etomzak/master
Fix out-of-bounds read/write in XhadFaster
This commit is contained in:
commit
701ac9bf76
|
@@ -97,10 +97,12 @@ void XhadFaster(const int n, const real_arg arg_alpha, const real_arg arg_beta,
|
||||||
const real alpha = GetRealArg(arg_alpha);
|
const real alpha = GetRealArg(arg_alpha);
|
||||||
const real beta = GetRealArg(arg_beta);
|
const real beta = GetRealArg(arg_beta);
|
||||||
|
|
||||||
if (get_global_id(0) < n / (VW)) {
|
const int num_desired_threads = n / (VW * WPT);
|
||||||
|
|
||||||
|
if (get_global_id(0) < num_desired_threads) {
|
||||||
#pragma unroll
|
#pragma unroll
|
||||||
for (int _w = 0; _w < WPT; _w += 1) {
|
for (int _w = 0; _w < WPT; _w += 1) {
|
||||||
const int id = _w*get_global_size(0) + get_global_id(0);
|
const int id = _w * num_desired_threads + get_global_id(0);
|
||||||
realV xvalue = xgm[id];
|
realV xvalue = xgm[id];
|
||||||
realV yvalue = ygm[id];
|
realV yvalue = ygm[id];
|
||||||
realV zvalue = zgm[id];
|
realV zvalue = zgm[id];
|
||||||
|
|
Loading…
Reference in a new issue