Skip to content

Commit

Permalink
Merge pull request #631 from sergeyvfx/div
Browse files Browse the repository at this point in the history
Fix with _mm_div_ps when SSE2NEON_PRECISE_DIV=1
  • Loading branch information
jserv committed May 14, 2024
2 parents ab7a347 + 85edff9 commit de0538f
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions sse2neon.h
Original file line number Diff line number Diff line change
Expand Up @@ -62,7 +62,7 @@
#ifndef SSE2NEON_PRECISE_MINMAX
#define SSE2NEON_PRECISE_MINMAX (0)
#endif
/* _mm_rcp_ps and _mm_div_ps */
/* _mm_rcp_ps */
#ifndef SSE2NEON_PRECISE_DIV
#define SSE2NEON_PRECISE_DIV (0)
#endif
Expand Down Expand Up @@ -1724,7 +1724,7 @@ FORCE_INLINE int64_t _mm_cvttss_si64(__m128 a)
// https://www.intel.com/content/www/us/en/docs/intrinsics-guide/index.html#text=_mm_div_ps
FORCE_INLINE __m128 _mm_div_ps(__m128 a, __m128 b)
{
#if (defined(__aarch64__) || defined(_M_ARM64)) && !SSE2NEON_PRECISE_DIV
#if defined(__aarch64__) || defined(_M_ARM64)
return vreinterpretq_m128_f32(
vdivq_f32(vreinterpretq_f32_m128(a), vreinterpretq_f32_m128(b)));
#else
Expand Down

0 comments on commit de0538f

Please sign in to comment.