Skip to content

Commit f141256

Browse files
authored
Merge pull request rapidsai#34 from sklam/fix/iss32
Use better gridsize calc to avoid cuda launch error
2 parents 916fe3d + 693d55f commit f141256

File tree

2 files changed

+7
-2
lines changed

2 files changed

+7
-2
lines changed

src/binaryops.cu

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,5 @@
1+
#include <algorithm>
2+
1 3
#include <gdf/gdf.h>
2 4
#include <gdf/utils.h>
3 5
#include <gdf/errorutils.h>
@@ -41,7 +43,8 @@ struct BinaryOp {
41 43
gpu_binary_op<T, Tout, F>)
42 44
);
43 45
// find needed gridsize
44-
int gridsize = (lhs->size + blocksize - 1) / blocksize;
46+
int neededgridsize = (lhs->size + blocksize - 1) / blocksize;
47+
int gridsize = std::min(mingridsize, neededgridsize);
45 48

46 49
F functor;
47 50
gpu_binary_op<<<gridsize, blocksize>>>(

src/unaryops.cu

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
1 1
#include <cmath>
2+
#include <algorithm>
2 3

3 4
#include <gdf/gdf.h>
4 5
#include <gdf/utils.h>
@@ -43,7 +44,8 @@ struct UnaryOp {
43 44
gpu_unary_op<T, Tout, F>)
44 45
);
45 46
// find needed gridsize
46-
int gridsize = (input->size + blocksize - 1) / blocksize;
47+
int neededgridsize = (input->size + blocksize - 1) / blocksize;
48+
int gridsize = std::min(neededgridsize, mingridsize);
47 49

48 50
F functor;
49 51
gpu_unary_op<<<gridsize, blocksize>>>(

0 commit comments

Comments
 (0)