Skip to content

Commit

Permalink
svml: require AVX not SSE for {i,u}divrem_epi32
Browse files Browse the repository at this point in the history
The Intel Intrinsics Guide (IIG) says that only SSE is required, but because
the types are __m256i, ICC will actually emit AVX instructions even if the
implementations themselves don't use AVX.
  • Loading branch information
nemequ committed Jun 22, 2020
1 parent ec3d983 commit 2931676
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions x86/svml.h
Original file line number Diff line number Diff line change
Expand Up @@ -3803,7 +3803,7 @@ simde_mm_idivrem_epi32 (simde__m128i* mem_addr, simde__m128i a, simde__m128i b)
SIMDE_FUNCTION_ATTRIBUTES
simde__m256i
simde_mm256_idivrem_epi32 (simde__m256i* mem_addr, simde__m256i a, simde__m256i b) {
#if defined(SIMDE_X86_SVML_NATIVE) && defined(SIMDE_X86_SSE2_NATIVE)
#if defined(SIMDE_X86_SVML_NATIVE) && defined(SIMDE_X86_AVX_NATIVE)
return _mm256_idivrem_epi32(HEDLEY_REINTERPRET_CAST(__m256i*, mem_addr), a, b);
#else
simde__m256i r;
Expand Down Expand Up @@ -7147,7 +7147,7 @@ simde_mm_udivrem_epi32 (simde__m128i * mem_addr, simde__m128i a, simde__m128i b)
SIMDE_FUNCTION_ATTRIBUTES
simde__m256i
simde_mm256_udivrem_epi32 (simde__m256i* mem_addr, simde__m256i a, simde__m256i b) {
#if defined(SIMDE_X86_SVML_NATIVE) && defined(SIMDE_X86_SSE2_NATIVE)
#if defined(SIMDE_X86_SVML_NATIVE) && defined(SIMDE_X86_AVX_NATIVE)
return _mm256_udivrem_epi32(HEDLEY_REINTERPRET_CAST(__m256i*, mem_addr), a, b);
#else
simde__m256i r;
Expand Down

0 comments on commit 2931676

Please sign in to comment.