Skip to content

Commit

Permalink
HOLY CRAP t590 WORKS WITH CUDA GEN
Browse files Browse the repository at this point in the history
  • Loading branch information
jeremylt committed Dec 12, 2024
1 parent 66c3c7c commit 6ed6b16
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion backends/cuda-gen/ceed-cuda-gen-operator-build.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -580,7 +580,7 @@ static int CeedOperatorBuildKernelQFunction_Cuda_gen(std::ostringstream &code, C
code << "\n // Note: Using batches of points\n";
code << " const CeedInt point_loop_bound = (blockDim.x * blockDim.y) * ceil(1.0 * max_num_points / (blockDim.x * blockDim.y));\n\n";
code << " #pragma unroll\n";
- code << " for (CeedInt i = 0; i < point_loop_bound; i++) {\n";
+ code << " for (CeedInt i = threadIdx.x + threadIdx.y * blockDim.x; i < point_loop_bound; i += blockDim.x * blockDim.y) {\n";
code << " const CeedInt p = i % max_num_points;\n\n";

code << " // -- Coordinates\n";
Expand Down

0 comments on commit 6ed6b16

Please sign in to comment.