Skip to content
Snippets Groups Projects

Vectorization improvements

Merged: Michael Kuron requested to merge ppc into master
1 file
+2 −2
Compare changes
  • Side-by-side
  • Inline
@@ -16,7 +16,7 @@
@@ -16,7 +16,7 @@
#include <arm_neon.h>
#include <arm_neon.h>
#endif
#endif
#ifdef __powerpc__
#if defined(__powerpc__) && defined(__GNUC__) && !defined(__clang__) && !defined(__ibmxl__)
#include <ppu_intrinsics.h>
#include <ppu_intrinsics.h>
#endif
#endif
#ifdef __ALTIVEC__
#ifdef __ALTIVEC__
@@ -46,7 +46,7 @@ QUALIFIERS uint32 mulhilo32(uint32 a, uint32 b, uint32* hip)
@@ -46,7 +46,7 @@ QUALIFIERS uint32 mulhilo32(uint32 a, uint32 b, uint32* hip)
{
{
#ifndef __CUDA_ARCH__
#ifndef __CUDA_ARCH__
// host code
// host code
#ifdef __powerpc__
#if defined(__powerpc__) && (!defined(__clang__) || defined(__ibmxl__))
*hip = __mulhwu(a,b);
*hip = __mulhwu(a,b);
return a*b;
return a*b;
#else
#else
Loading