From 943c57a26c4644cca92da6f9ec256dd7280f381b Mon Sep 17 00:00:00 2001 From: Prasanth Nunna Date: Thu, 9 May 2024 23:56:04 +0000 Subject: [PATCH] Sync files with upstream --- include/Algo-Direct2.h | 16 ++++++++-------- include/SIMD.h | 4 ++-- 2 files changed, 10 insertions(+), 10 deletions(-) diff --git a/include/Algo-Direct2.h b/include/Algo-Direct2.h index 91dded6f4..547ca9955 100644 --- a/include/Algo-Direct2.h +++ b/include/Algo-Direct2.h @@ -94,8 +94,8 @@ struct AlgoVecBase::val __m128 vxp = _mm_shuffle_ps(xp01, xp23, (1) + (3 << 2) + (1 << 4) + (3 << 6)); #endif IVec i(u.vec); - IVec vlem = operator< (vz, vxm); - IVec vlep = operator< (vz, vxp); + IVec vlem = vz < vxm; + IVec vlep = vz < vxp; i = i + vlem + vlep; i.store(pr); } @@ -124,8 +124,8 @@ struct AlgoVecBase::val __m128d vxp = _mm_shuffle_pd(vx0, vx1, 3); IVec i(b1, b0); - IVec vlem = operator< (vz, vxm); - IVec vlep = operator< (vz, vxp); + IVec vlem = (vz < vxm); + IVec vlep = (vz < vxp); i = i + vlem + vlep; union { @@ -229,8 +229,8 @@ struct AlgoVecBase::val #endif - IVec vlem = operator< (vz, vxm); - IVec vlep = operator< (vz, vxp); + IVec vlem = vz < vxm; + IVec vlep = vz < vxp; ip = ip + vlem + vlep; ip.store(pr); @@ -279,8 +279,8 @@ struct AlgoVecBase::val // FVec vxp = _mm256_insertf128_pd(_mm256_castpd128_pd256(h01p), h23p, 1); IVec i(u.vec); - IVec vlem = operator< (vz, vxm); - IVec vlep = operator< (vz, vxp); + IVec vlem = vz < vxm; + IVec vlep = vz < vxp; i = i + vlem + vlep; i.extractLo32s().store(pr); } diff --git a/include/SIMD.h b/include/SIMD.h index e97f5fc33..9d1410c73 100644 --- a/include/SIMD.h +++ b/include/SIMD.h @@ -307,7 +307,7 @@ FORCE_INLINE FVec operator- (const FVec& a, const FVec< FORCE_INLINE FVec operator* (const FVec& a, const FVec& b) { return _mm_mul_ps( a, b ); } FORCE_INLINE FVec operator/ (const FVec& a, const FVec& b) { return _mm_div_ps( a, b ); } FORCE_INLINE IVec ftoi (const FVec& a) { return _mm_cvttps_epi32(a); } -#if !defined(__clang__) || defined(__HIP_PLATFORM_AMD__) // Conflicts with builtin operator +#ifndef __clang__ // Conflicts with builtin operator FORCE_INLINE IVec operator<= (const FVec& a, const FVec& b) { return _mm_castps_si128( _mm_cmple_ps( a, b ) ); } FORCE_INLINE IVec operator>= (const FVec& a, const FVec& b) { return _mm_castps_si128( _mm_cmpge_ps( a, b ) ); } FORCE_INLINE IVec operator< (const FVec& a, const FVec& b) { return _mm_castps_si128(_mm_cmplt_ps(a, b)); } @@ -363,7 +363,7 @@ FORCE_INLINE FVec operator- (const FVec& a, const FVec FORCE_INLINE FVec operator* (const FVec& a, const FVec& b) { return _mm_mul_pd( a, b ); } FORCE_INLINE FVec operator/ (const FVec& a, const FVec& b) { return _mm_div_pd( a, b ); } FORCE_INLINE IVec ftoi (const FVec& a) { return _mm_cvttpd_epi32(a); } -#if !defined(__clang__) || defined(__HIP_PLATFORM_AMD__) // Conflicts with builtin operator +#ifndef __clang__ // Conflicts with builtin operator FORCE_INLINE IVec operator<= (const FVec& a, const FVec& b) { return _mm_castpd_si128( _mm_cmple_pd( a, b ) ); } FORCE_INLINE IVec operator< (const FVec& a, const FVec& b) { return _mm_castpd_si128(_mm_cmplt_pd(a, b)); } FORCE_INLINE IVec operator>= (const FVec& a, const FVec& b) { return _mm_castpd_si128( _mm_cmpge_pd( a, b ) ); }