Extend Support for CUDA and HIP kernel invocations
+ 169
− 115
@@ -10,8 +10,9 @@ from pystencils.codegen.gpu_indexing import (
@@ -99,18 +100,60 @@ class SfgGpuComposer(SfgComposerMixIn):
@@ -120,134 +163,145 @@ class SfgGpuComposer(SfgComposerMixIn):