Skip to content

Commit

Permalink
warp: use SSE4.1 code path with AVX
Browse files Browse the repository at this point in the history
  • Loading branch information
rouault committed Nov 10, 2024
1 parent db73dcc commit 0642738
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions alg/gdalwarpkernel.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2995,7 +2995,7 @@ static CPL_INLINE __m128 XMMLoad4Values(const GByte *ptr)
__m128i xmm_i = _mm_cvtsi32_si128(i);
// Zero extend the 4 packed unsigned 8-bit integers in xmm_i to packed
// 32-bit integers.
-#if defined(__SSE4_1__) || defined(USE_NEON_OPTIMIZATIONS)
+#if defined(__SSE4_1__) || defined(__AVX__) || defined(USE_NEON_OPTIMIZATIONS)
xmm_i = _mm_cvtepu8_epi32(xmm_i);
#else
xmm_i = _mm_unpacklo_epi8(xmm_i, _mm_setzero_si128());
Expand All @@ -3011,7 +3011,7 @@ static CPL_INLINE __m128 XMMLoad4Values(const GUInt16 *ptr)
__m128i xmm_i = _mm_cvtsi64_si128(i);
// Zero extend the 4 packed unsigned 16-bit integers in xmm_i to packed
// 32-bit integers.
-#if defined(__SSE4_1__) || defined(USE_NEON_OPTIMIZATIONS)
+#if defined(__SSE4_1__) || defined(__AVX__) || defined(USE_NEON_OPTIMIZATIONS)
xmm_i = _mm_cvtepu16_epi32(xmm_i);
#else
xmm_i = _mm_unpacklo_epi16(xmm_i, _mm_setzero_si128());
Expand Down

0 comments on commit 0642738

Please sign in to comment.