diff --git a/src/pystencils/backend/platforms/cuda.py b/src/pystencils/backend/platforms/cuda.py index 73c4b3b471390e92bdf6e2ea10ecc163b8fea932..fa246c1286a048fef5386e653aa76556ed74c185 100644 --- a/src/pystencils/backend/platforms/cuda.py +++ b/src/pystencils/backend/platforms/cuda.py @@ -65,7 +65,7 @@ class CudaPlatform(GenericGpu): @property def required_headers(self) -> set[str]: - return {'"gpu_defines.h"', "<cuda/std/limits>"} + return {'"gpu_defines.h"'} def materialize_iteration_space( self, body: PsBlock, ispace: IterationSpace @@ -85,8 +85,11 @@ class CudaPlatform(GenericGpu): arg_types = (dtype,) * func.num_args if isinstance(dtype, PsScalarType) and func in (NumericLimitsFunctions.Min, NumericLimitsFunctions.Max): + assert isinstance(dtype, PsIeeeFloatType) + defines = { NumericLimitsFunctions.Min: "NEG_INFINITY", NumericLimitsFunctions.Max: "POS_INFINITY" } + return PsLiteralExpr( - PsLiteral(f"::cuda::std::numeric_limits<{dtype.c_string()}>::{func.function_name}()", dtype)) + PsLiteral(defines[func.function_name], dtype)) if isinstance(dtype, PsIeeeFloatType): match func: