[CLANG] [AVX512] [BUILTIN] Adding PSRA{W|WI}{128|256|512}.

Differential Revision: http://reviews.llvm.org/D17706

llvm-svn: 262481
This commit is contained in:
Michael Zuckerman 2016-03-02 12:06:06 +00:00
parent 927fdaee88
commit 3df95e711f
4 changed files with 160 additions and 0 deletions

View File

@ -1685,6 +1685,12 @@ TARGET_BUILTIN(__builtin_ia32_psrav4si_mask, "V4iV4iV4iV4iUc","","avx512vl")
TARGET_BUILTIN(__builtin_ia32_psrav8si_mask, "V8iV8iV8iV8iUc","","avx512vl") TARGET_BUILTIN(__builtin_ia32_psrav8si_mask, "V8iV8iV8iV8iUc","","avx512vl")
TARGET_BUILTIN(__builtin_ia32_psravq128_mask, "V2LLiV2LLiV2LLiV2LLiUc","","avx512vl") TARGET_BUILTIN(__builtin_ia32_psravq128_mask, "V2LLiV2LLiV2LLiV2LLiUc","","avx512vl")
TARGET_BUILTIN(__builtin_ia32_psravq256_mask, "V4LLiV4LLiV4LLiV4LLiUc","","avx512vl") TARGET_BUILTIN(__builtin_ia32_psravq256_mask, "V4LLiV4LLiV4LLiV4LLiUc","","avx512vl")
// Masked PSRAW / PSRAWI builtins (shift of packed 16-bit elements) for 128-,
// 256- and 512-bit vectors. As called from the intrinsic headers, the operands
// are: source vector, shift count (a 128-bit vector for psraw*, an integer for
// psrawi*), pass-through vector, write mask. The 512-bit forms require
// avx512bw; the 128/256-bit forms require avx512bw and avx512vl.
// NOTE(review): the "Ii" operand of the psrawi* entries presumably forces the
// count to be an integer constant expression -- confirm against the type
// encoding notes in Builtins.def.
TARGET_BUILTIN(__builtin_ia32_psraw512_mask, "V32sV32sV8sV32sUi","","avx512bw")
TARGET_BUILTIN(__builtin_ia32_psrawi512_mask, "V32sV32sIiV32sUi","","avx512bw")
TARGET_BUILTIN(__builtin_ia32_psraw128_mask, "V8sV8sV8sV8sUc","","avx512bw,avx512vl")
TARGET_BUILTIN(__builtin_ia32_psraw256_mask, "V16sV16sV8sV16sUs","","avx512bw,avx512vl")
TARGET_BUILTIN(__builtin_ia32_psrawi128_mask, "V8sV8sIiV8sUc","","avx512bw,avx512vl")
TARGET_BUILTIN(__builtin_ia32_psrawi256_mask, "V16sV16sIiV16sUs","","avx512bw,avx512vl")
#undef BUILTIN #undef BUILTIN
#undef TARGET_BUILTIN #undef TARGET_BUILTIN

View File

@ -1778,6 +1778,57 @@ _mm512_maskz_srav_epi16 (__mmask32 __U, __m512i __A, __m512i __B)
_mm512_setzero_hi (), _mm512_setzero_hi (),
(__mmask32) __U); (__mmask32) __U);
} }
/* Unmasked 512-bit PSRAW wrapper: forwards __A (data) and __B (shift count
   vector) to the masked builtin with a zero pass-through vector and an
   all-ones mask, so every 16-bit lane is selected. */
static __inline__ __m512i __DEFAULT_FN_ATTRS
_mm512_sra_epi16 (__m512i __A, __m128i __B)
{
  __v32hi __src = (__v32hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v32hi __passthru = (__v32hi) _mm512_setzero_hi ();
  __mmask32 __all_lanes = (__mmask32) -1;

  return (__m512i) __builtin_ia32_psraw512_mask (__src, __count,
                                                 __passthru, __all_lanes);
}
/* Merge-masked 512-bit PSRAW wrapper: forwards __A (data) and __B (shift
   count vector) to the masked builtin, with __W as the pass-through vector
   and __U as the write mask. */
static __inline__ __m512i __DEFAULT_FN_ATTRS
_mm512_mask_sra_epi16 (__m512i __W, __mmask32 __U, __m512i __A,
                       __m128i __B)
{
  __v32hi __src = (__v32hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v32hi __passthru = (__v32hi) __W;
  __mmask32 __k = (__mmask32) __U;

  return (__m512i) __builtin_ia32_psraw512_mask (__src, __count,
                                                 __passthru, __k);
}
/* Zero-masked 512-bit PSRAW wrapper: forwards __A (data) and __B (shift
   count vector) to the masked builtin, with an all-zero pass-through vector
   and __U as the write mask. */
static __inline__ __m512i __DEFAULT_FN_ATTRS
_mm512_maskz_sra_epi16 (__mmask32 __U, __m512i __A, __m128i __B)
{
  __v32hi __src = (__v32hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v32hi __zero = (__v32hi) _mm512_setzero_hi ();
  __mmask32 __k = (__mmask32) __U;

  return (__m512i) __builtin_ia32_psraw512_mask (__src, __count,
                                                 __zero, __k);
}
/* Unmasked 512-bit PSRAWI wrapper: shifts __A by the immediate count __B.
   Implemented as a macro so that __B reaches the builtin as a constant.
   The mask must be all ones (-1) so that every one of the 32 lanes takes the
   shifted result; any cleared bit would instead select the zero pass-through
   value for that lane. */
#define _mm512_srai_epi16( __A, __B) __extension__ ({ \
__builtin_ia32_psrawi512_mask ((__v32hi)( __A),( __B),\
(__v32hi)\
_mm512_setzero_hi (),\
(__mmask32) -1);\
})
/* Merge-masked 512-bit PSRAWI wrapper: passes __A (data) and __B (shift
   count) to the masked builtin with __W as the pass-through vector and __U
   as the write mask. Kept as a macro so __B is forwarded textually to the
   builtin. */
#define _mm512_mask_srai_epi16( __W, __U, __A, __B) __extension__ ({ \
__builtin_ia32_psrawi512_mask ((__v32hi)( __A),( __B),\
(__v32hi)( __W),\
(__mmask32)( __U));\
})
/* Zero-masked 512-bit PSRAWI wrapper: passes __A (data) and __B (shift
   count) to the masked builtin with an all-zero pass-through vector and __U
   as the write mask. Kept as a macro so __B is forwarded textually to the
   builtin. */
#define _mm512_maskz_srai_epi16( __U, __A, __B) __extension__ ({ \
__builtin_ia32_psrawi512_mask ((__v32hi)( __A),( __B),\
(__v32hi)\
_mm512_setzero_hi (),\
(__mmask32)( __U));\
})
#undef __DEFAULT_FN_ATTRS #undef __DEFAULT_FN_ATTRS
#endif #endif

View File

@ -2715,6 +2715,72 @@ _mm_maskz_srav_epi16 (__mmask8 __U, __m128i __A, __m128i __B)
(__mmask8) __U); (__mmask8) __U);
} }
/* Merge-masked 128-bit PSRAW wrapper: forwards __A (data) and __B (shift
   count vector) to the masked builtin, with __W as the pass-through vector
   and __U as the write mask. */
static __inline__ __m128i __DEFAULT_FN_ATTRS
_mm_mask_sra_epi16 (__m128i __W, __mmask8 __U, __m128i __A,
                    __m128i __B)
{
  __v8hi __src = (__v8hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v8hi __passthru = (__v8hi) __W;
  __mmask8 __k = (__mmask8) __U;

  return (__m128i) __builtin_ia32_psraw128_mask (__src, __count,
                                                 __passthru, __k);
}
/* Zero-masked 128-bit PSRAW wrapper: forwards __A (data) and __B (shift
   count vector) to the masked builtin, with an all-zero pass-through vector
   and __U as the write mask. */
static __inline__ __m128i __DEFAULT_FN_ATTRS
_mm_maskz_sra_epi16 (__mmask8 __U, __m128i __A, __m128i __B)
{
  __v8hi __src = (__v8hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v8hi __zero = (__v8hi) _mm_setzero_si128 ();
  __mmask8 __k = (__mmask8) __U;

  return (__m128i) __builtin_ia32_psraw128_mask (__src, __count,
                                                 __zero, __k);
}
/* Merge-masked 256-bit PSRAW wrapper: forwards __A (data) and __B (128-bit
   shift count vector) to the masked builtin, with __W as the pass-through
   vector and __U as the write mask. */
static __inline__ __m256i __DEFAULT_FN_ATTRS
_mm256_mask_sra_epi16 (__m256i __W, __mmask16 __U, __m256i __A,
                       __m128i __B)
{
  __v16hi __src = (__v16hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v16hi __passthru = (__v16hi) __W;
  __mmask16 __k = (__mmask16) __U;

  return (__m256i) __builtin_ia32_psraw256_mask (__src, __count,
                                                 __passthru, __k);
}
/* Zero-masked 256-bit PSRAW wrapper: forwards __A (data) and __B (128-bit
   shift count vector) to the masked builtin, with an all-zero pass-through
   vector and __U as the write mask. */
static __inline__ __m256i __DEFAULT_FN_ATTRS
_mm256_maskz_sra_epi16 (__mmask16 __U, __m256i __A, __m128i __B)
{
  __v16hi __src = (__v16hi) __A;
  __v8hi __count = (__v8hi) __B;
  __v16hi __zero = (__v16hi) _mm256_setzero_si256 ();
  __mmask16 __k = (__mmask16) __U;

  return (__m256i) __builtin_ia32_psraw256_mask (__src, __count,
                                                 __zero, __k);
}
/* Merge-masked 128-bit PSRAWI wrapper: passes __A (data) and __imm (shift
   count) to the masked builtin with __W as the pass-through vector and __U
   as the write mask. Kept as a macro so __imm is forwarded textually to the
   builtin. */
#define _mm_mask_srai_epi16( __W, __U, __A, __imm) __extension__ ({ \
__builtin_ia32_psrawi128_mask ((__v8hi)( __A),( __imm),\
(__v8hi)( __W),\
(__mmask8)( __U));\
})
/* Zero-masked 128-bit PSRAWI wrapper: passes __A (data) and __imm (shift
   count) to the masked builtin with an all-zero pass-through vector and __U
   as the write mask. Kept as a macro so __imm is forwarded textually to the
   builtin. */
#define _mm_maskz_srai_epi16( __U, __A, __imm) __extension__ ({ \
__builtin_ia32_psrawi128_mask ((__v8hi)( __A),( __imm),\
(__v8hi)\
_mm_setzero_si128 (),\
(__mmask8)( __U));\
})
/* Merge-masked 256-bit PSRAWI wrapper: passes __A (data) and __imm (shift
   count) to the masked builtin with __W as the pass-through vector and __U
   as the write mask. Kept as a macro so __imm is forwarded textually to the
   builtin. */
#define _mm256_mask_srai_epi16( __W, __U, __A, __imm) __extension__ ({ \
__builtin_ia32_psrawi256_mask ((__v16hi)( __A),( __imm),\
(__v16hi)( __W),\
(__mmask16)( __U));\
})
/* Zero-masked 256-bit PSRAWI wrapper: passes __A (data) and __imm (shift
   count) to the masked builtin with an all-zero pass-through vector and __U
   as the write mask. Kept as a macro so __imm is forwarded textually to the
   builtin. */
#define _mm256_maskz_srai_epi16( __U, __A, __imm) __extension__ ({ \
__builtin_ia32_psrawi256_mask ((__v16hi)( __A),( __imm),\
(__v16hi)\
_mm256_setzero_si256 (),\
(__mmask16)( __U));\
})
#undef __DEFAULT_FN_ATTRS #undef __DEFAULT_FN_ATTRS
#endif /* __AVX512VLBWINTRIN_H */ #endif /* __AVX512VLBWINTRIN_H */

View File

@ -1203,4 +1203,41 @@ __m512i test_mm512_maskz_srav_epi16(__mmask32 __U, __m512i __A, __m512i __B) {
return _mm512_maskz_srav_epi16(__U, __A, __B); return _mm512_maskz_srav_epi16(__U, __A, __B);
} }
// Codegen test: the unmasked _mm512_sra_epi16 wrapper must be emitted as a
// call to the masked psra.w.512 intrinsic.
__m512i test_mm512_sra_epi16(__m512i __A, __m128i __B) {
// CHECK-LABEL: @test_mm512_sra_epi16
// CHECK: @llvm.x86.avx512.mask.psra.w.512
return _mm512_sra_epi16(__A, __B);
}
// Codegen test: the merge-masked _mm512_mask_sra_epi16 wrapper must be
// emitted as a call to the masked psra.w.512 intrinsic.
__m512i test_mm512_mask_sra_epi16(__m512i __W, __mmask32 __U, __m512i __A, __m128i __B) {
// CHECK-LABEL: @test_mm512_mask_sra_epi16
// CHECK: @llvm.x86.avx512.mask.psra.w.512
return _mm512_mask_sra_epi16(__W, __U, __A, __B);
}
// Codegen test: the zero-masked _mm512_maskz_sra_epi16 wrapper must be
// emitted as a call to the masked psra.w.512 intrinsic.
__m512i test_mm512_maskz_sra_epi16(__mmask32 __U, __m512i __A, __m128i __B) {
// CHECK-LABEL: @test_mm512_maskz_sra_epi16
// CHECK: @llvm.x86.avx512.mask.psra.w.512
return _mm512_maskz_sra_epi16(__U, __A, __B);
}
// Codegen test: the unmasked _mm512_srai_epi16 macro, called with the
// literal count 5, must be emitted as a call to the masked psra.wi.512
// intrinsic.
__m512i test_mm512_srai_epi16(__m512i __A) {
// CHECK-LABEL: @test_mm512_srai_epi16
// CHECK: @llvm.x86.avx512.mask.psra.wi.512
return _mm512_srai_epi16(__A, 5);
}
// Codegen test: the merge-masked _mm512_mask_srai_epi16 macro, called with
// the literal count 5, must be emitted as a call to the masked psra.wi.512
// intrinsic.
__m512i test_mm512_mask_srai_epi16(__m512i __W, __mmask32 __U, __m512i __A) {
// CHECK-LABEL: @test_mm512_mask_srai_epi16
// CHECK: @llvm.x86.avx512.mask.psra.wi.512
return _mm512_mask_srai_epi16(__W, __U, __A, 5);
}
// Codegen test: the zero-masked _mm512_maskz_srai_epi16 macro, called with
// the literal count 5, must be emitted as a call to the masked psra.wi.512
// intrinsic.
__m512i test_mm512_maskz_srai_epi16(__mmask32 __U, __m512i __A) {
// CHECK-LABEL: @test_mm512_maskz_srai_epi16
// CHECK: @llvm.x86.avx512.mask.psra.wi.512
return _mm512_maskz_srai_epi16(__U, __A, 5);
}