Skip to content

Commit

Permalink
Merge pull request #8570 from gmarkall/release0.56-fix
Browse files Browse the repository at this point in the history
Release 0.56 branch: Fix overloads with `target="generic"` for CUDA
  • Loading branch information
esc committed Nov 2, 2022
2 parents 463dcd9 + 4c4e319 commit 288a38b
Showing 1 changed file with 10 additions and 8 deletions.
18 changes: 10 additions & 8 deletions numba/cuda/compiler.py
Expand Up @@ -207,14 +207,16 @@ def compile_cuda(pyfunc, return_type, args, debug=False, lineinfo=False,
 flags.nvvm_options = nvvm_options

 # Run compilation pipeline
-cres = compiler.compile_extra(typingctx=typingctx,
-                              targetctx=targetctx,
-                              func=pyfunc,
-                              args=args,
-                              return_type=return_type,
-                              flags=flags,
-                              locals={},
-                              pipeline_class=CUDACompiler)
+from numba.core.target_extension import target_override
+with target_override('cuda'):
+    cres = compiler.compile_extra(typingctx=typingctx,
+                                  targetctx=targetctx,
+                                  func=pyfunc,
+                                  args=args,
+                                  return_type=return_type,
+                                  flags=flags,
+                                  locals={},
+                                  pipeline_class=CUDACompiler)

 library = cres.library
 library.finalize()
Expand Down

0 comments on commit 288a38b

Please sign in to comment.