We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 73b28c8, commit c23ab7f (Copy full SHA for c23ab7f)
src/CUDAKernels.jl
@@ -145,9 +145,10 @@ end
145
end
146
147
@device_override @inline function KA.__index_Global_Linear(ctx)
148
- I = @inbounds KA.expand(KA.__iterspace(ctx), blockIdx().x, threadIdx().x)
+ # I = @inbounds KA.expand(KA.__iterspace(ctx), blockIdx().x, threadIdx().x)
149
+ return (blockIdx().x-1) * blockDim().x + threadIdx().x
150
# TODO: This is unfortunate, can we get the linear index cheaper
- @inbounds LinearIndices(KA.__ndrange(ctx))[I]
151
+ # @inbounds LinearIndices(KA.__ndrange(ctx))[I]
152
153
154
@device_override @inline function KA.__index_Local_Cartesian(ctx)
0 commit comments