1f58f3647b19c40455065c7395db82848d8830981Craig Topper/*===---- bmi2intrin.h - BMI2 intrinsics -----------------------------------=== 2f58f3647b19c40455065c7395db82848d8830981Craig Topper * 3f58f3647b19c40455065c7395db82848d8830981Craig Topper * Permission is hereby granted, free of charge, to any person obtaining a copy 4f58f3647b19c40455065c7395db82848d8830981Craig Topper * of this software and associated documentation files (the "Software"), to deal 5f58f3647b19c40455065c7395db82848d8830981Craig Topper * in the Software without restriction, including without limitation the rights 6f58f3647b19c40455065c7395db82848d8830981Craig Topper * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7f58f3647b19c40455065c7395db82848d8830981Craig Topper * copies of the Software, and to permit persons to whom the Software is 8f58f3647b19c40455065c7395db82848d8830981Craig Topper * furnished to do so, subject to the following conditions: 9f58f3647b19c40455065c7395db82848d8830981Craig Topper * 10f58f3647b19c40455065c7395db82848d8830981Craig Topper * The above copyright notice and this permission notice shall be included in 11f58f3647b19c40455065c7395db82848d8830981Craig Topper * all copies or substantial portions of the Software. 12f58f3647b19c40455065c7395db82848d8830981Craig Topper * 13f58f3647b19c40455065c7395db82848d8830981Craig Topper * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14f58f3647b19c40455065c7395db82848d8830981Craig Topper * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15f58f3647b19c40455065c7395db82848d8830981Craig Topper * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16f58f3647b19c40455065c7395db82848d8830981Craig Topper * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17f58f3647b19c40455065c7395db82848d8830981Craig Topper * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18f58f3647b19c40455065c7395db82848d8830981Craig Topper * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 19f58f3647b19c40455065c7395db82848d8830981Craig Topper * THE SOFTWARE. 20f58f3647b19c40455065c7395db82848d8830981Craig Topper * 21f58f3647b19c40455065c7395db82848d8830981Craig Topper *===-----------------------------------------------------------------------=== 22f58f3647b19c40455065c7395db82848d8830981Craig Topper */ 23f58f3647b19c40455065c7395db82848d8830981Craig Topper 24f58f3647b19c40455065c7395db82848d8830981Craig Topper#if !defined __X86INTRIN_H && !defined __IMMINTRIN_H 25f58f3647b19c40455065c7395db82848d8830981Craig Topper#error "Never use <bmi2intrin.h> directly; include <x86intrin.h> instead." 26f58f3647b19c40455065c7395db82848d8830981Craig Topper#endif 27f58f3647b19c40455065c7395db82848d8830981Craig Topper 28f58f3647b19c40455065c7395db82848d8830981Craig Topper#ifndef __BMI2__ 29f58f3647b19c40455065c7395db82848d8830981Craig Topper# error "BMI2 instruction set not enabled" 30f58f3647b19c40455065c7395db82848d8830981Craig Topper#endif /* __BMI2__ */ 31f58f3647b19c40455065c7395db82848d8830981Craig Topper 32f58f3647b19c40455065c7395db82848d8830981Craig Topper#ifndef __BMI2INTRIN_H 33f58f3647b19c40455065c7395db82848d8830981Craig Topper#define __BMI2INTRIN_H 34f58f3647b19c40455065c7395db82848d8830981Craig Topper 35f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned int __attribute__((__always_inline__, __nodebug__)) 36f58f3647b19c40455065c7395db82848d8830981Craig Topper_bzhi_u32(unsigned int __X, unsigned int __Y) 37f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 38f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_bzhi_si(__X, __Y); 39f58f3647b19c40455065c7395db82848d8830981Craig Topper} 40f58f3647b19c40455065c7395db82848d8830981Craig Topper 41f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned int __attribute__((__always_inline__, __nodebug__)) 42f58f3647b19c40455065c7395db82848d8830981Craig Topper_pdep_u32(unsigned int __X, unsigned int __Y) 43f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 44f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_pdep_si(__X, __Y); 45f58f3647b19c40455065c7395db82848d8830981Craig Topper} 46f58f3647b19c40455065c7395db82848d8830981Craig Topper 47f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned int __attribute__((__always_inline__, __nodebug__)) 48f58f3647b19c40455065c7395db82848d8830981Craig Topper_pext_u32(unsigned int __X, unsigned int __Y) 49f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 50f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_pext_si(__X, __Y); 51f58f3647b19c40455065c7395db82848d8830981Craig Topper} 52f58f3647b19c40455065c7395db82848d8830981Craig Topper 53f58f3647b19c40455065c7395db82848d8830981Craig Topper#ifdef __x86_64__ 54f58f3647b19c40455065c7395db82848d8830981Craig Topper 55f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__)) 56f58f3647b19c40455065c7395db82848d8830981Craig Topper_bzhi_u64(unsigned long long __X, unsigned long long __Y) 57f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 58f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_bzhi_di(__X, __Y); 59f58f3647b19c40455065c7395db82848d8830981Craig Topper} 60f58f3647b19c40455065c7395db82848d8830981Craig Topper 61f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__)) 62f58f3647b19c40455065c7395db82848d8830981Craig Topper_pdep_u64(unsigned long long __X, unsigned long long __Y) 63f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 64f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_pdep_di(__X, __Y); 65f58f3647b19c40455065c7395db82848d8830981Craig Topper} 66f58f3647b19c40455065c7395db82848d8830981Craig Topper 67f58f3647b19c40455065c7395db82848d8830981Craig Topperstatic __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__)) 68f58f3647b19c40455065c7395db82848d8830981Craig Topper_pext_u64(unsigned long long __X, unsigned long long __Y) 69f58f3647b19c40455065c7395db82848d8830981Craig Topper{ 70f58f3647b19c40455065c7395db82848d8830981Craig Topper return __builtin_ia32_pext_di(__X, __Y); 71f58f3647b19c40455065c7395db82848d8830981Craig Topper} 72f58f3647b19c40455065c7395db82848d8830981Craig Topper 734d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liaostatic __inline__ unsigned long long __attribute__((__always_inline__, __nodebug__)) 744d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao_mulx_u64 (unsigned long long __X, unsigned long long __Y, 754d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao unsigned long long *__P) 764d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao{ 774d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao unsigned __int128 __res = (unsigned __int128) __X * __Y; 784d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao *__P = (unsigned long long) (__res >> 64); 794d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao return (unsigned long long) __res; 804d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao} 814d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao 824d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao#else /* !__x86_64__ */ 834d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao 844d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liaostatic __inline__ unsigned int __attribute__((__always_inline__, __nodebug__)) 854d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao_mulx_u32 (unsigned int __X, unsigned int __Y, unsigned int *__P) 864d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao{ 874d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao unsigned long long __res = (unsigned long long) __X * __Y; 884d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao *__P = (unsigned int) (__res >> 32); 894d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao return (unsigned int) __res; 904d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao} 914d1499dbfb8b6ebf893ec51a3016d3409706d647Michael Liao 92f58f3647b19c40455065c7395db82848d8830981Craig Topper#endif /* !__x86_64__ */ 93f58f3647b19c40455065c7395db82848d8830981Craig Topper 94f58f3647b19c40455065c7395db82848d8830981Craig Topper#endif /* __BMI2INTRIN_H */ 95