#if !defined(SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H) #define SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H #include "types.h" #include "roundscale.h" HEDLEY_DIAGNOSTIC_PUSH SIMDE_DISABLE_UNWANTED_DIAGNOSTICS SIMDE_BEGIN_DECLS_ #if defined(HEDLEY_MSVC_VERSION) #pragma warning( push ) #pragma warning( disable : 4244 ) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) #define simde_mm512_roundscale_round_ps(a, imm8, sae) _mm512_roundscale_round_ps(a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_ps(a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_roundscale_round_ps(a,imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512 simde_mm512_roundscale_round_ps_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_roundscale_round_ps_envp; \ int simde_mm512_roundscale_round_ps_x = feholdexcept(&simde_mm512_roundscale_round_ps_envp); \ simde_mm512_roundscale_round_ps_r = simde_mm512_roundscale_ps(a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_roundscale_round_ps_x == 0)) \ fesetenv(&simde_mm512_roundscale_round_ps_envp); \ } \ else { \ simde_mm512_roundscale_round_ps_r = simde_mm512_roundscale_ps(a, imm8); \ } \ \ simde_mm512_roundscale_round_ps_r; \ })) #else #define simde_mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_ps(a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512 simde_mm512_roundscale_round_ps (simde__m512 a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_roundscale_ps(a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_roundscale_ps(a, imm8); #endif } else { r = simde_mm512_roundscale_ps(a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_roundscale_round_ps #define _mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_round_ps(a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) _mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_ps(src, k, a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512 simde_mm512_mask_roundscale_round_ps_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_mask_roundscale_round_ps_envp; \ int simde_mm512_mask_roundscale_round_ps_x = feholdexcept(&simde_mm512_mask_roundscale_round_ps_envp); \ simde_mm512_mask_roundscale_round_ps_r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_mask_roundscale_round_ps_x == 0)) \ fesetenv(&simde_mm512_mask_roundscale_round_ps_envp); \ } \ else { \ simde_mm512_mask_roundscale_round_ps_r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); \ } \ \ simde_mm512_mask_roundscale_round_ps_r; \ })) #else #define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_ps(src, k, a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512 simde_mm512_mask_roundscale_round_ps (simde__m512 src, simde__mmask8 k, simde__m512 a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); #endif } else { r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_mask_roundscale_round_ps #define _mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) _mm512_maskz_roundscale_round_ps(k, a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) simde_mm512_maskz_roundscale_ps(k, a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512 simde_mm512_maskz_roundscale_round_ps_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_maskz_roundscale_round_ps_envp; \ int simde_mm512_maskz_roundscale_round_ps_x = feholdexcept(&simde_mm512_maskz_roundscale_round_ps_envp); \ simde_mm512_maskz_roundscale_round_ps_r = simde_mm512_maskz_roundscale_ps(k, a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_maskz_roundscale_round_ps_x == 0)) \ fesetenv(&simde_mm512_maskz_roundscale_round_ps_envp); \ } \ else { \ simde_mm512_maskz_roundscale_round_ps_r = simde_mm512_maskz_roundscale_ps(k, a, imm8); \ } \ \ simde_mm512_maskz_roundscale_round_ps_r; \ })) #else #define simde_mm512_maskz_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_maskz_roundscale_ps(k, a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512 simde_mm512_maskz_roundscale_round_ps (simde__mmask8 k, simde__m512 a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_maskz_roundscale_ps(k, a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_maskz_roundscale_ps(k, a, imm8); #endif } else { r = simde_mm512_maskz_roundscale_ps(k, a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_maskz_roundscale_round_ps #define _mm512_maskz_roundscale_round_ps(k, a, imm8, sae) simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) #define simde_mm512_roundscale_round_pd(a, imm8, sae) _mm512_roundscale_round_pd(a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_pd(a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_roundscale_round_pd(a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512d simde_mm512_roundscale_round_pd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_roundscale_round_pd_envp; \ int simde_mm512_roundscale_round_pd_x = feholdexcept(&simde_mm512_roundscale_round_pd_envp); \ simde_mm512_roundscale_round_pd_r = simde_mm512_roundscale_pd(a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_roundscale_round_pd_x == 0)) \ fesetenv(&simde_mm512_roundscale_round_pd_envp); \ } \ else { \ simde_mm512_roundscale_round_pd_r = simde_mm512_roundscale_pd(a, imm8); \ } \ \ simde_mm512_roundscale_round_pd_r; \ })) #else #define simde_mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_pd(a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512d simde_mm512_roundscale_round_pd (simde__m512d a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_roundscale_pd(a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_roundscale_pd(a, imm8); #endif } else { r = simde_mm512_roundscale_pd(a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_roundscale_round_pd #define _mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_round_pd(a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) _mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_pd(src, k, a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512d simde_mm512_mask_roundscale_round_pd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_mask_roundscale_round_pd_envp; \ int simde_mm512_mask_roundscale_round_pd_x = feholdexcept(&simde_mm512_mask_roundscale_round_pd_envp); \ simde_mm512_mask_roundscale_round_pd_r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_mask_roundscale_round_pd_x == 0)) \ fesetenv(&simde_mm512_mask_roundscale_round_pd_envp); \ } \ else { \ simde_mm512_mask_roundscale_round_pd_r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); \ } \ \ simde_mm512_mask_roundscale_round_pd_r; \ })) #else #define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_pd(src, k, a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512d simde_mm512_mask_roundscale_round_pd (simde__m512d src, simde__mmask8 k, simde__m512d a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); #endif } else { r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_mask_roundscale_round_pd #define _mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) _mm512_maskz_roundscale_round_pd(k, a, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) simde_mm512_maskz_roundscale_pd(k, a, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m512d simde_mm512_maskz_roundscale_round_pd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm512_maskz_roundscale_round_pd_envp; \ int simde_mm512_maskz_roundscale_round_pd_x = feholdexcept(&simde_mm512_maskz_roundscale_round_pd_envp); \ simde_mm512_maskz_roundscale_round_pd_r = simde_mm512_maskz_roundscale_pd(k, a, imm8); \ if (HEDLEY_LIKELY(simde_mm512_maskz_roundscale_round_pd_x == 0)) \ fesetenv(&simde_mm512_maskz_roundscale_round_pd_envp); \ } \ else { \ simde_mm512_maskz_roundscale_round_pd_r = simde_mm512_maskz_roundscale_pd(k, a, imm8); \ } \ \ simde_mm512_maskz_roundscale_round_pd_r; \ })) #else #define simde_mm512_maskz_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_maskz_roundscale_pd(k, a, imm8) #endif #else SIMDE_FUNCTION_ATTRIBUTES simde__m512d simde_mm512_maskz_roundscale_round_pd (simde__mmask8 k, simde__m512d a, int imm8, int sae) SIMDE_REQUIRE_RANGE(imm8, 0, 15) { simde__m512d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm512_maskz_roundscale_pd(k, a, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm512_maskz_roundscale_pd(k, a, imm8); #endif } else { r = simde_mm512_maskz_roundscale_pd(k, a, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm512_maskz_roundscale_round_pd #define _mm512_maskz_roundscale_round_pd(k, a, imm8, sae) simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) #define simde_mm_roundscale_round_ss(a, b, imm8, sae) _mm_roundscale_round_ss(a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_ss(a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_roundscale_round_ss(a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128 simde_mm_roundscale_round_ss_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_roundscale_round_ss_envp; \ int simde_mm_roundscale_round_ss_x = feholdexcept(&simde_mm_roundscale_round_ss_envp); \ simde_mm_roundscale_round_ss_r = simde_mm_roundscale_ss(a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_roundscale_round_ss_x == 0)) \ fesetenv(&simde_mm_roundscale_round_ss_envp); \ } \ else { \ simde_mm_roundscale_round_ss_r = simde_mm_roundscale_ss(a, b, imm8); \ } \ \ simde_mm_roundscale_round_ss_r; \ })) #else #define simde_mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_ss(a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128 simde_mm_roundscale_round_ss (simde__m128 a, simde__m128 b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_roundscale_ss(a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_roundscale_ss(a, b, imm8); #endif } else { r = simde_mm_roundscale_ss(a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_roundscale_round_ss #define _mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_round_ss(a, b, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) _mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_ss(src, k, a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128 simde_mm_mask_roundscale_round_ss_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_mask_roundscale_round_ss_envp; \ int simde_mm_mask_roundscale_round_ss_x = feholdexcept(&simde_mm_mask_roundscale_round_ss_envp); \ simde_mm_mask_roundscale_round_ss_r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_mask_roundscale_round_ss_x == 0)) \ fesetenv(&simde_mm_mask_roundscale_round_ss_envp); \ } \ else { \ simde_mm_mask_roundscale_round_ss_r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); \ } \ \ simde_mm_mask_roundscale_round_ss_r; \ })) #else #define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_ss(src, k, a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128 simde_mm_mask_roundscale_round_ss (simde__m128 src, simde__mmask8 k, simde__m128 a, simde__m128 b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); #endif } else { r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_mask_roundscale_round_ss #define _mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) _mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_ss(k, a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128 simde_mm_maskz_roundscale_round_ss_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_maskz_roundscale_round_ss_envp; \ int simde_mm_maskz_roundscale_round_ss_x = feholdexcept(&simde_mm_maskz_roundscale_round_ss_envp); \ simde_mm_maskz_roundscale_round_ss_r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_maskz_roundscale_round_ss_x == 0)) \ fesetenv(&simde_mm_maskz_roundscale_round_ss_envp); \ } \ else { \ simde_mm_maskz_roundscale_round_ss_r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); \ } \ \ simde_mm_maskz_roundscale_round_ss_r; \ })) #else #define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_ss(k, a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128 simde_mm_maskz_roundscale_round_ss (simde__mmask8 k, simde__m128 a, simde__m128 b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128 r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); #endif } else { r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_maskz_roundscale_round_ss #define _mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) #endif #if defined(HEDLEY_MSVC_VERSION) #pragma warning( pop ) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) #define simde_mm_roundscale_round_sd(a, b, imm8, sae) _mm_roundscale_round_sd(a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_sd(a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_roundscale_round_sd(a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128d simde_mm_roundscale_round_sd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_roundscale_round_sd_envp; \ int simde_mm_roundscale_round_sd_x = feholdexcept(&simde_mm_roundscale_round_sd_envp); \ simde_mm_roundscale_round_sd_r = simde_mm_roundscale_sd(a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_roundscale_round_sd_x == 0)) \ fesetenv(&simde_mm_roundscale_round_sd_envp); \ } \ else { \ simde_mm_roundscale_round_sd_r = simde_mm_roundscale_sd(a, b, imm8); \ } \ \ simde_mm_roundscale_round_sd_r; \ })) #else #define simde_mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_sd(a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128d simde_mm_roundscale_round_sd (simde__m128d a, simde__m128d b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_roundscale_sd(a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_roundscale_sd(a, b, imm8); #endif } else { r = simde_mm_roundscale_sd(a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_roundscale_round_sd #define _mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_round_sd(a, b, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) _mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_sd(src, k, a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128d simde_mm_mask_roundscale_round_sd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_mask_roundscale_round_sd_envp; \ int simde_mm_mask_roundscale_round_sd_x = feholdexcept(&simde_mm_mask_roundscale_round_sd_envp); \ simde_mm_mask_roundscale_round_sd_r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_mask_roundscale_round_sd_x == 0)) \ fesetenv(&simde_mm_mask_roundscale_round_sd_envp); \ } \ else { \ simde_mm_mask_roundscale_round_sd_r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); \ } \ \ simde_mm_mask_roundscale_round_sd_r; \ })) #else #define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_sd(src, k, a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128d simde_mm_mask_roundscale_round_sd (simde__m128d src, simde__mmask8 k, simde__m128d a, simde__m128d b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); #endif } else { r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_mask_roundscale_round_sd #define _mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) #endif #if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035) #define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) _mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) #elif defined(SIMDE_FAST_EXCEPTIONS) #define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_sd(k, a, b, imm8) #elif defined(SIMDE_STATEMENT_EXPR_) #if defined(SIMDE_HAVE_FENV_H) #define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \ simde__m128d simde_mm_maskz_roundscale_round_sd_r; \ \ if (sae & SIMDE_MM_FROUND_NO_EXC) { \ fenv_t simde_mm_maskz_roundscale_round_sd_envp; \ int simde_mm_maskz_roundscale_round_sd_x = feholdexcept(&simde_mm_maskz_roundscale_round_sd_envp); \ simde_mm_maskz_roundscale_round_sd_r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); \ if (HEDLEY_LIKELY(simde_mm_maskz_roundscale_round_sd_x == 0)) \ fesetenv(&simde_mm_maskz_roundscale_round_sd_envp); \ } \ else { \ simde_mm_maskz_roundscale_round_sd_r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); \ } \ \ simde_mm_maskz_roundscale_round_sd_r; \ })) #else #define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_sd(k, a, b, imm8) #endif #elif !(defined(HEDLEY_MSVC_VERSION) && defined(SIMDE_X86_AVX_NATIVE)) SIMDE_FUNCTION_ATTRIBUTES simde__m128d simde_mm_maskz_roundscale_round_sd (simde__mmask8 k, simde__m128d a, simde__m128d b, const int imm8, const int sae) SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255) SIMDE_REQUIRE_CONSTANT(sae) { simde__m128d r; if (sae & SIMDE_MM_FROUND_NO_EXC) { #if defined(SIMDE_HAVE_FENV_H) fenv_t envp; int x = feholdexcept(&envp); r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); if (HEDLEY_LIKELY(x == 0)) fesetenv(&envp); #else r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); #endif } else { r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); } return r; } #endif #if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES) #undef _mm_maskz_roundscale_round_sd #define _mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) #endif SIMDE_END_DECLS_ HEDLEY_DIAGNOSTIC_POP #endif /* !defined(SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H) */