[avx512] rename gcc intrinsics to be align with gcc format

rename the gcc intrinsics suffix : _mask ->_round

Differential Revision: http://reviews.llvm.org/D15284

llvm-svn: 254906
This commit is contained in:
Asaf Badouh 2015-12-07 13:14:22 +00:00
parent d38ba8c80c
commit 3e5111e313
2 changed files with 72 additions and 72 deletions

View File

@ -1300,18 +1300,18 @@ TARGET_BUILTIN(__builtin_ia32_subps512_mask, "V16fV16fV16fV16fUsIi", "", "avx512
TARGET_BUILTIN(__builtin_ia32_pmaddubsw512_mask, "V32sV64cV64cV32sUi", "", "avx512bw")
TARGET_BUILTIN(__builtin_ia32_pmaddwd512_mask, "V16iV32sV32sV16iUs", "", "avx512bw")
TARGET_BUILTIN(__builtin_ia32_addss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_divss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_mulss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_subss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_maxss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_minss_mask, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_addsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_divsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_mulsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_subsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_maxsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_minsd_mask, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_addss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_divss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_mulss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_subss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_maxss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_minss_round, "V4fV4fV4fV4fUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_addsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_divsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_mulsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_subsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_maxsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_minsd_round, "V2dV2dV2dV2dUcIi", "", "avx512f")
TARGET_BUILTIN(__builtin_ia32_addpd128_mask, "V2dV2dV2dV2dUc", "", "avx512vl")
TARGET_BUILTIN(__builtin_ia32_addpd256_mask, "V4dV4dV4dV4dUc", "", "avx512vl")

View File

@ -569,7 +569,7 @@ _mm512_max_ps(__m512 __A, __m512 __B)
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_max_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_maxss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_maxss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -578,7 +578,7 @@ _mm_mask_max_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_max_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_maxss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_maxss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
@ -586,20 +586,20 @@ _mm_maskz_max_ss(__mmask8 __U,__m128 __A, __m128 __B) {
}
#define _mm_max_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_maxss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_maxss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_max_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_maxss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_maxss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_max_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_maxss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_maxss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_max_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_maxsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_maxsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -608,7 +608,7 @@ _mm_mask_max_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_max_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_maxsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_maxsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
@ -616,15 +616,15 @@ _mm_maskz_max_sd(__mmask8 __U,__m128d __A, __m128d __B) {
}
#define _mm_max_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_maxsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_maxsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_max_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_maxsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_maxsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_max_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_maxsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_maxsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline __m512i
@ -692,7 +692,7 @@ _mm512_min_ps(__m512 __A, __m512 __B)
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_min_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_minss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_minss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -701,7 +701,7 @@ _mm_mask_min_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_min_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_minss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_minss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
@ -709,20 +709,20 @@ _mm_maskz_min_ss(__mmask8 __U,__m128 __A, __m128 __B) {
}
#define _mm_min_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_minss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_minss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_min_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_minss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_minss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_min_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_minss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_minss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_min_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_minsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_minsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -731,7 +731,7 @@ _mm_mask_min_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_min_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_minsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_minsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
@ -739,15 +739,15 @@ _mm_maskz_min_sd(__mmask8 __U,__m128d __A, __m128d __B) {
}
#define _mm_min_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_minsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_minsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_min_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_minsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_minsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_min_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_minsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_minsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline __m512i
@ -1019,7 +1019,7 @@ _mm512_abs_epi32(__m512i __A)
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_add_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_addss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_addss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -1028,7 +1028,7 @@ _mm_mask_add_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_add_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_addss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_addss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
@ -1036,20 +1036,20 @@ _mm_maskz_add_ss(__mmask8 __U,__m128 __A, __m128 __B) {
}
#define _mm_add_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_addss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_addss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_add_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_addss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_addss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_add_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_addss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_addss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_add_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_addsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_addsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -1058,22 +1058,22 @@ _mm_mask_add_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_add_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_addsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_addsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
_MM_FROUND_CUR_DIRECTION);
}
#define _mm_add_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_addsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_addsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_add_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_addsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_addsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_add_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_addsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_addsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline__ __m512d __DEFAULT_FN_ATTRS
@ -1138,7 +1138,7 @@ _mm512_maskz_add_ps(__mmask16 __U, __m512 __A, __m512 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_sub_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_subss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_subss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -1147,27 +1147,27 @@ _mm_mask_sub_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_sub_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_subss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_subss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
_MM_FROUND_CUR_DIRECTION);
}
#define _mm_sub_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_subss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_subss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_sub_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_subss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_subss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_sub_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_subss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_subss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_sub_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_subsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_subsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -1176,7 +1176,7 @@ _mm_mask_sub_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_sub_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_subsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_subsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
@ -1184,15 +1184,15 @@ _mm_maskz_sub_sd(__mmask8 __U,__m128d __A, __m128d __B) {
}
#define _mm_sub_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_subsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_subsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_sub_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_subsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_subsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_sub_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_subsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_subsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline__ __m512d __DEFAULT_FN_ATTRS
@ -1259,7 +1259,7 @@ _mm512_maskz_sub_ps(__mmask16 __U, __m512 __A, __m512 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_mul_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_mulss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_mulss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -1268,27 +1268,27 @@ _mm_mask_mul_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_mul_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_mulss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_mulss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
_MM_FROUND_CUR_DIRECTION);
}
#define _mm_mul_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_mulss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_mulss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_mul_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_mulss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_mulss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_mul_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_mulss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_mulss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_mul_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_mulsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_mulsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -1297,7 +1297,7 @@ _mm_mask_mul_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_mul_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_mulsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_mulsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
@ -1305,15 +1305,15 @@ _mm_maskz_mul_sd(__mmask8 __U,__m128d __A, __m128d __B) {
}
#define _mm_mul_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_mulsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_mulsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_mul_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_mulsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_mulsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_mul_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_mulsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_mulsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline__ __m512d __DEFAULT_FN_ATTRS
@ -1380,7 +1380,7 @@ _mm512_maskz_mul_ps(__mmask16 __U, __m512 __A, __m512 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_mask_div_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_divss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_divss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) __W,
(__mmask8) __U,
@ -1389,7 +1389,7 @@ _mm_mask_div_ss(__m128 __W, __mmask8 __U,__m128 __A, __m128 __B) {
static __inline__ __m128 __DEFAULT_FN_ATTRS
_mm_maskz_div_ss(__mmask8 __U,__m128 __A, __m128 __B) {
return (__m128) __builtin_ia32_divss_mask ((__v4sf) __A,
return (__m128) __builtin_ia32_divss_round ((__v4sf) __A,
(__v4sf) __B,
(__v4sf) _mm_setzero_ps (),
(__mmask8) __U,
@ -1397,20 +1397,20 @@ _mm_maskz_div_ss(__mmask8 __U,__m128 __A, __m128 __B) {
}
#define _mm_div_round_ss(__A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_divss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_divss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) -1, __R); })
#define _mm_mask_div_round_ss(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_divss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_divss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) __W, (__mmask8) __U,__R); })
#define _mm_maskz_div_round_ss(__U, __A, __B, __R) __extension__ ({ \
(__m128) __builtin_ia32_divss_mask ((__v4sf) __A, (__v4sf) __B, \
(__m128) __builtin_ia32_divss_round ((__v4sf) __A, (__v4sf) __B, \
(__v4sf) _mm_setzero_ps(), (__mmask8) __U,__R); })
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_mask_div_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_divsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_divsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) __W,
(__mmask8) __U,
@ -1419,7 +1419,7 @@ _mm_mask_div_sd(__m128d __W, __mmask8 __U,__m128d __A, __m128d __B) {
static __inline__ __m128d __DEFAULT_FN_ATTRS
_mm_maskz_div_sd(__mmask8 __U,__m128d __A, __m128d __B) {
return (__m128d) __builtin_ia32_divsd_mask ((__v2df) __A,
return (__m128d) __builtin_ia32_divsd_round ((__v2df) __A,
(__v2df) __B,
(__v2df) _mm_setzero_pd (),
(__mmask8) __U,
@ -1427,15 +1427,15 @@ _mm_maskz_div_sd(__mmask8 __U,__m128d __A, __m128d __B) {
}
#define _mm_div_round_sd(__A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_divsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_divsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) -1, __R); })
#define _mm_mask_div_round_sd(__W, __U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_divsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_divsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) __W, (__mmask8) __U,__R); })
#define _mm_maskz_div_round_sd(__U, __A, __B, __R) __extension__ ({ \
(__m128d) __builtin_ia32_divsd_mask ((__v2df) __A, (__v2df) __B, \
(__m128d) __builtin_ia32_divsd_round ((__v2df) __A, (__v2df) __B, \
(__v2df) _mm_setzero_pd(), (__mmask8) __U,__R); })
static __inline__ __m512d __DEFAULT_FN_ATTRS