687 lines
26 KiB
C
687 lines
26 KiB
C
#if !defined(SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H)
|
|
#define SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H
|
|
|
|
#include "types.h"
|
|
#include "roundscale.h"
|
|
|
|
HEDLEY_DIAGNOSTIC_PUSH
|
|
SIMDE_DISABLE_UNWANTED_DIAGNOSTICS
|
|
SIMDE_BEGIN_DECLS_
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE)
|
|
#define simde_mm512_roundscale_round_ps(a, imm8, sae) _mm512_roundscale_round_ps(a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_ps(a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_roundscale_round_ps(a,imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512 simde_mm512_roundscale_round_ps_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_roundscale_round_ps_envp; \
|
|
int simde_mm512_roundscale_round_ps_x = feholdexcept(&simde_mm512_roundscale_round_ps_envp); \
|
|
simde_mm512_roundscale_round_ps_r = simde_mm512_roundscale_ps(a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_roundscale_round_ps_x == 0)) \
|
|
fesetenv(&simde_mm512_roundscale_round_ps_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_roundscale_round_ps_r = simde_mm512_roundscale_ps(a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_roundscale_round_ps_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_ps(a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512
|
|
simde_mm512_roundscale_round_ps (simde__m512 a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_roundscale_ps(a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_roundscale_ps(a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_roundscale_ps(a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_roundscale_round_ps
|
|
#define _mm512_roundscale_round_ps(a, imm8, sae) simde_mm512_roundscale_round_ps(a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) _mm512_mask_roundscale_round_ps(src, k, a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_ps(src, k, a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512 simde_mm512_mask_roundscale_round_ps_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_mask_roundscale_round_ps_envp; \
|
|
int simde_mm512_mask_roundscale_round_ps_x = feholdexcept(&simde_mm512_mask_roundscale_round_ps_envp); \
|
|
simde_mm512_mask_roundscale_round_ps_r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_mask_roundscale_round_ps_x == 0)) \
|
|
fesetenv(&simde_mm512_mask_roundscale_round_ps_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_mask_roundscale_round_ps_r = simde_mm512_mask_roundscale_ps(src, k, a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_mask_roundscale_round_ps_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_ps(src, k, a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512
|
|
simde_mm512_mask_roundscale_round_ps (simde__m512 src, simde__mmask8 k, simde__m512 a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_mask_roundscale_ps(src, k, a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_mask_roundscale_ps(src, k, a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_mask_roundscale_ps(src, k, a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_mask_roundscale_round_ps
|
|
#define _mm512_mask_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_mask_roundscale_round_ps(src, k, a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) _mm512_maskz_roundscale_round_ps(k, a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) simde_mm512_maskz_roundscale_ps(k, a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512 simde_mm512_maskz_roundscale_round_ps_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_maskz_roundscale_round_ps_envp; \
|
|
int simde_mm512_maskz_roundscale_round_ps_x = feholdexcept(&simde_mm512_maskz_roundscale_round_ps_envp); \
|
|
simde_mm512_maskz_roundscale_round_ps_r = simde_mm512_maskz_roundscale_ps(k, a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_maskz_roundscale_round_ps_x == 0)) \
|
|
fesetenv(&simde_mm512_maskz_roundscale_round_ps_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_maskz_roundscale_round_ps_r = simde_mm512_maskz_roundscale_ps(k, a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_maskz_roundscale_round_ps_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_maskz_roundscale_round_ps(src, k, a, imm8, sae) simde_mm512_maskz_roundscale_ps(k, a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512
|
|
simde_mm512_maskz_roundscale_round_ps (simde__mmask8 k, simde__m512 a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_maskz_roundscale_ps(k, a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_maskz_roundscale_ps(k, a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_maskz_roundscale_ps(k, a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_maskz_roundscale_round_ps
|
|
#define _mm512_maskz_roundscale_round_ps(k, a, imm8, sae) simde_mm512_maskz_roundscale_round_ps(k, a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE)
|
|
#define simde_mm512_roundscale_round_pd(a, imm8, sae) _mm512_roundscale_round_pd(a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_pd(a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_roundscale_round_pd(a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512d simde_mm512_roundscale_round_pd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_roundscale_round_pd_envp; \
|
|
int simde_mm512_roundscale_round_pd_x = feholdexcept(&simde_mm512_roundscale_round_pd_envp); \
|
|
simde_mm512_roundscale_round_pd_r = simde_mm512_roundscale_pd(a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_roundscale_round_pd_x == 0)) \
|
|
fesetenv(&simde_mm512_roundscale_round_pd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_roundscale_round_pd_r = simde_mm512_roundscale_pd(a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_roundscale_round_pd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_pd(a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512d
|
|
simde_mm512_roundscale_round_pd (simde__m512d a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_roundscale_pd(a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_roundscale_pd(a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_roundscale_pd(a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_roundscale_round_pd
|
|
#define _mm512_roundscale_round_pd(a, imm8, sae) simde_mm512_roundscale_round_pd(a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) _mm512_mask_roundscale_round_pd(src, k, a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_pd(src, k, a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512d simde_mm512_mask_roundscale_round_pd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_mask_roundscale_round_pd_envp; \
|
|
int simde_mm512_mask_roundscale_round_pd_x = feholdexcept(&simde_mm512_mask_roundscale_round_pd_envp); \
|
|
simde_mm512_mask_roundscale_round_pd_r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_mask_roundscale_round_pd_x == 0)) \
|
|
fesetenv(&simde_mm512_mask_roundscale_round_pd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_mask_roundscale_round_pd_r = simde_mm512_mask_roundscale_pd(src, k, a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_mask_roundscale_round_pd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_pd(src, k, a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512d
|
|
simde_mm512_mask_roundscale_round_pd (simde__m512d src, simde__mmask8 k, simde__m512d a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_mask_roundscale_pd(src, k, a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_mask_roundscale_pd(src, k, a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_mask_roundscale_pd(src, k, a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_mask_roundscale_round_pd
|
|
#define _mm512_mask_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_mask_roundscale_round_pd(src, k, a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) _mm512_maskz_roundscale_round_pd(k, a, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) simde_mm512_maskz_roundscale_pd(k, a, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m512d simde_mm512_maskz_roundscale_round_pd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm512_maskz_roundscale_round_pd_envp; \
|
|
int simde_mm512_maskz_roundscale_round_pd_x = feholdexcept(&simde_mm512_maskz_roundscale_round_pd_envp); \
|
|
simde_mm512_maskz_roundscale_round_pd_r = simde_mm512_maskz_roundscale_pd(k, a, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm512_maskz_roundscale_round_pd_x == 0)) \
|
|
fesetenv(&simde_mm512_maskz_roundscale_round_pd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm512_maskz_roundscale_round_pd_r = simde_mm512_maskz_roundscale_pd(k, a, imm8); \
|
|
} \
|
|
\
|
|
simde_mm512_maskz_roundscale_round_pd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm512_maskz_roundscale_round_pd(src, k, a, imm8, sae) simde_mm512_maskz_roundscale_pd(k, a, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m512d
|
|
simde_mm512_maskz_roundscale_round_pd (simde__mmask8 k, simde__m512d a, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 15)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m512d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm512_maskz_roundscale_pd(k, a, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm512_maskz_roundscale_pd(k, a, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm512_maskz_roundscale_pd(k, a, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm512_maskz_roundscale_round_pd
|
|
#define _mm512_maskz_roundscale_round_pd(k, a, imm8, sae) simde_mm512_maskz_roundscale_round_pd(k, a, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE)
|
|
#define simde_mm_roundscale_round_ss(a, b, imm8, sae) _mm_roundscale_round_ss(a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_ss(a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_roundscale_round_ss(a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128 simde_mm_roundscale_round_ss_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_roundscale_round_ss_envp; \
|
|
int simde_mm_roundscale_round_ss_x = feholdexcept(&simde_mm_roundscale_round_ss_envp); \
|
|
simde_mm_roundscale_round_ss_r = simde_mm_roundscale_ss(a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_roundscale_round_ss_x == 0)) \
|
|
fesetenv(&simde_mm_roundscale_round_ss_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_roundscale_round_ss_r = simde_mm_roundscale_ss(a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_roundscale_round_ss_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_ss(a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128
|
|
simde_mm_roundscale_round_ss (simde__m128 a, simde__m128 b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_roundscale_ss(a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_roundscale_ss(a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_roundscale_ss(a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_roundscale_round_ss
|
|
#define _mm_roundscale_round_ss(a, b, imm8, sae) simde_mm_roundscale_round_ss(a, b, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) _mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_ss(src, k, a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128 simde_mm_mask_roundscale_round_ss_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_mask_roundscale_round_ss_envp; \
|
|
int simde_mm_mask_roundscale_round_ss_x = feholdexcept(&simde_mm_mask_roundscale_round_ss_envp); \
|
|
simde_mm_mask_roundscale_round_ss_r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_mask_roundscale_round_ss_x == 0)) \
|
|
fesetenv(&simde_mm_mask_roundscale_round_ss_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_mask_roundscale_round_ss_r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_mask_roundscale_round_ss_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_ss(src, k, a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128
|
|
simde_mm_mask_roundscale_round_ss (simde__m128 src, simde__mmask8 k, simde__m128 a, simde__m128 b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_mask_roundscale_ss(src, k, a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_mask_roundscale_round_ss
|
|
#define _mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_round_ss(src, k, a, b, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) _mm_maskz_roundscale_round_ss(k, a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_ss(k, a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128 simde_mm_maskz_roundscale_round_ss_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_maskz_roundscale_round_ss_envp; \
|
|
int simde_mm_maskz_roundscale_round_ss_x = feholdexcept(&simde_mm_maskz_roundscale_round_ss_envp); \
|
|
simde_mm_maskz_roundscale_round_ss_r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_maskz_roundscale_round_ss_x == 0)) \
|
|
fesetenv(&simde_mm_maskz_roundscale_round_ss_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_maskz_roundscale_round_ss_r = simde_mm_maskz_roundscale_ss(k, a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_maskz_roundscale_round_ss_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_ss(k, a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128
|
|
simde_mm_maskz_roundscale_round_ss (simde__mmask8 k, simde__m128 a, simde__m128 b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128 r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_maskz_roundscale_ss(k, a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_maskz_roundscale_ss(k, a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_maskz_roundscale_ss(k, a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_maskz_roundscale_round_ss
|
|
#define _mm_maskz_roundscale_round_ss(k, a, b, imm8, sae) simde_mm_maskz_roundscale_round_ss(k, a, b, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE)
|
|
#define simde_mm_roundscale_round_sd(a, b, imm8, sae) _mm_roundscale_round_sd(a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_sd(a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_roundscale_round_sd(a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128d simde_mm_roundscale_round_sd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_roundscale_round_sd_envp; \
|
|
int simde_mm_roundscale_round_sd_x = feholdexcept(&simde_mm_roundscale_round_sd_envp); \
|
|
simde_mm_roundscale_round_sd_r = simde_mm_roundscale_sd(a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_roundscale_round_sd_x == 0)) \
|
|
fesetenv(&simde_mm_roundscale_round_sd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_roundscale_round_sd_r = simde_mm_roundscale_sd(a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_roundscale_round_sd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_sd(a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128d
|
|
simde_mm_roundscale_round_sd (simde__m128d a, simde__m128d b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_roundscale_sd(a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_roundscale_sd(a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_roundscale_sd(a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_roundscale_round_sd
|
|
#define _mm_roundscale_round_sd(a, b, imm8, sae) simde_mm_roundscale_round_sd(a, b, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) _mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_sd(src, k, a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128d simde_mm_mask_roundscale_round_sd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_mask_roundscale_round_sd_envp; \
|
|
int simde_mm_mask_roundscale_round_sd_x = feholdexcept(&simde_mm_mask_roundscale_round_sd_envp); \
|
|
simde_mm_mask_roundscale_round_sd_r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_mask_roundscale_round_sd_x == 0)) \
|
|
fesetenv(&simde_mm_mask_roundscale_round_sd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_mask_roundscale_round_sd_r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_mask_roundscale_round_sd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_sd(src, k, a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128d
|
|
simde_mm_mask_roundscale_round_sd (simde__m128d src, simde__mmask8 k, simde__m128d a, simde__m128d b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_mask_roundscale_sd(src, k, a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_mask_roundscale_round_sd
|
|
#define _mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae) simde_mm_mask_roundscale_round_sd(src, k, a, b, imm8, sae)
|
|
#endif
|
|
|
|
#if defined(SIMDE_X86_AVX512F_NATIVE) && !defined(SIMDE_BUG_GCC_92035)
|
|
#define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) _mm_maskz_roundscale_round_sd(k, a, b, imm8, sae)
|
|
#elif defined(SIMDE_FAST_EXCEPTIONS)
|
|
#define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_sd(k, a, b, imm8)
|
|
#elif defined(SIMDE_STATEMENT_EXPR_)
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
#define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) SIMDE_STATEMENT_EXPR_(({ \
|
|
simde__m128d simde_mm_maskz_roundscale_round_sd_r; \
|
|
\
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) { \
|
|
fenv_t simde_mm_maskz_roundscale_round_sd_envp; \
|
|
int simde_mm_maskz_roundscale_round_sd_x = feholdexcept(&simde_mm_maskz_roundscale_round_sd_envp); \
|
|
simde_mm_maskz_roundscale_round_sd_r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); \
|
|
if (HEDLEY_LIKELY(simde_mm_maskz_roundscale_round_sd_x == 0)) \
|
|
fesetenv(&simde_mm_maskz_roundscale_round_sd_envp); \
|
|
} \
|
|
else { \
|
|
simde_mm_maskz_roundscale_round_sd_r = simde_mm_maskz_roundscale_sd(k, a, b, imm8); \
|
|
} \
|
|
\
|
|
simde_mm_maskz_roundscale_round_sd_r; \
|
|
}))
|
|
#else
|
|
#define simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_sd(k, a, b, imm8)
|
|
#endif
|
|
#else
|
|
SIMDE_FUNCTION_ATTRIBUTES
|
|
simde__m128d
|
|
simde_mm_maskz_roundscale_round_sd (simde__mmask8 k, simde__m128d a, simde__m128d b, int imm8, int sae)
|
|
SIMDE_REQUIRE_CONSTANT_RANGE(imm8, 0, 255)
|
|
SIMDE_REQUIRE_CONSTANT(sae) {
|
|
simde__m128d r;
|
|
|
|
if (sae & SIMDE_MM_FROUND_NO_EXC) {
|
|
#if defined(SIMDE_HAVE_FENV_H)
|
|
fenv_t envp;
|
|
int x = feholdexcept(&envp);
|
|
r = simde_mm_maskz_roundscale_sd(k, a, b, imm8);
|
|
if (HEDLEY_LIKELY(x == 0))
|
|
fesetenv(&envp);
|
|
#else
|
|
r = simde_mm_maskz_roundscale_sd(k, a, b, imm8);
|
|
#endif
|
|
}
|
|
else {
|
|
r = simde_mm_maskz_roundscale_sd(k, a, b, imm8);
|
|
}
|
|
|
|
return r;
|
|
}
|
|
#endif
|
|
#if defined(SIMDE_X86_AVX512F_ENABLE_NATIVE_ALIASES)
|
|
#undef _mm_maskz_roundscale_round_sd
|
|
#define _mm_maskz_roundscale_round_sd(k, a, b, imm8, sae) simde_mm_maskz_roundscale_round_sd(k, a, b, imm8, sae)
|
|
#endif
|
|
|
|
SIMDE_END_DECLS_
|
|
HEDLEY_DIAGNOSTIC_POP
|
|
|
|
#endif /* !defined(SIMDE_X86_AVX512_ROUNDSCALE_ROUND_H) */
|