Home | History | Annotate | Line # | Download | only in i386
ia32intrin.h revision 1.10
      1  1.10  mrg /* Copyright (C) 2009-2018 Free Software Foundation, Inc.
      2   1.1  mrg 
      3   1.1  mrg    This file is part of GCC.
      4   1.1  mrg 
      5   1.1  mrg    GCC is free software; you can redistribute it and/or modify
      6   1.1  mrg    it under the terms of the GNU General Public License as published by
      7   1.1  mrg    the Free Software Foundation; either version 3, or (at your option)
      8   1.1  mrg    any later version.
      9   1.1  mrg 
     10   1.1  mrg    GCC is distributed in the hope that it will be useful,
     11   1.1  mrg    but WITHOUT ANY WARRANTY; without even the implied warranty of
     12   1.1  mrg    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     13   1.1  mrg    GNU General Public License for more details.
     14   1.1  mrg 
     15   1.1  mrg    Under Section 7 of GPL version 3, you are granted additional
     16   1.1  mrg    permissions described in the GCC Runtime Library Exception, version
     17   1.1  mrg    3.1, as published by the Free Software Foundation.
     18   1.1  mrg 
     19   1.1  mrg    You should have received a copy of the GNU General Public License and
     20   1.1  mrg    a copy of the GCC Runtime Library Exception along with this program;
     21   1.1  mrg    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
     22   1.1  mrg    <http://www.gnu.org/licenses/>.  */
     23   1.1  mrg 
     24   1.1  mrg #ifndef _X86INTRIN_H_INCLUDED
     25   1.1  mrg # error "Never use <ia32intrin.h> directly; include <x86intrin.h> instead."
     26   1.1  mrg #endif
     27   1.1  mrg 
     28   1.1  mrg /* 32bit bsf */
     29   1.1  mrg extern __inline int
     30   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     31   1.1  mrg __bsfd (int __X)
     32   1.1  mrg {
     33   1.1  mrg   return __builtin_ctz (__X);
     34   1.1  mrg }
     35   1.1  mrg 
     36   1.1  mrg /* 32bit bsr */
     37   1.1  mrg extern __inline int
     38   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     39   1.1  mrg __bsrd (int __X)
     40   1.1  mrg {
     41   1.1  mrg   return __builtin_ia32_bsrsi (__X);
     42   1.1  mrg }
     43   1.1  mrg 
     44   1.1  mrg /* 32bit bswap */
     45   1.1  mrg extern __inline int
     46   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     47   1.1  mrg __bswapd (int __X)
     48   1.1  mrg {
     49   1.1  mrg   return __builtin_bswap32 (__X);
     50   1.1  mrg }
     51   1.1  mrg 
     52   1.7  mrg #ifndef __iamcu__
     53   1.7  mrg 
     54   1.5  mrg #ifndef __SSE4_2__
     55   1.5  mrg #pragma GCC push_options
     56   1.5  mrg #pragma GCC target("sse4.2")
     57   1.5  mrg #define __DISABLE_SSE4_2__
     58   1.5  mrg #endif /* __SSE4_2__ */
     59   1.5  mrg 
     60   1.1  mrg /* 32bit accumulate CRC32 (polynomial 0x11EDC6F41) value.  */
     61   1.1  mrg extern __inline unsigned int
     62   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     63   1.1  mrg __crc32b (unsigned int __C, unsigned char __V)
     64   1.1  mrg {
     65   1.1  mrg   return __builtin_ia32_crc32qi (__C, __V);
     66   1.1  mrg }
     67   1.1  mrg 
     68   1.1  mrg extern __inline unsigned int
     69   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     70   1.1  mrg __crc32w (unsigned int __C, unsigned short __V)
     71   1.1  mrg {
     72   1.1  mrg   return __builtin_ia32_crc32hi (__C, __V);
     73   1.1  mrg }
     74   1.1  mrg 
     75   1.1  mrg extern __inline unsigned int
     76   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     77   1.1  mrg __crc32d (unsigned int __C, unsigned int __V)
     78   1.1  mrg {
     79   1.1  mrg   return __builtin_ia32_crc32si (__C, __V);
     80   1.1  mrg }
     81   1.5  mrg 
     82   1.5  mrg #ifdef __DISABLE_SSE4_2__
     83   1.5  mrg #undef __DISABLE_SSE4_2__
     84   1.5  mrg #pragma GCC pop_options
     85   1.5  mrg #endif /* __DISABLE_SSE4_2__ */
     86   1.1  mrg 
     87   1.7  mrg #endif /* __iamcu__ */
     88   1.7  mrg 
     89   1.1  mrg /* 32bit popcnt */
     90   1.1  mrg extern __inline int
     91   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
     92   1.1  mrg __popcntd (unsigned int __X)
     93   1.1  mrg {
     94   1.1  mrg   return __builtin_popcount (__X);
     95   1.1  mrg }
     96   1.1  mrg 
     97   1.7  mrg #ifndef __iamcu__
     98   1.7  mrg 
     99   1.1  mrg /* rdpmc */
    100   1.1  mrg extern __inline unsigned long long
    101   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    102   1.1  mrg __rdpmc (int __S)
    103   1.1  mrg {
    104   1.1  mrg   return __builtin_ia32_rdpmc (__S);
    105   1.1  mrg }
    106   1.1  mrg 
    107   1.7  mrg #endif /* __iamcu__ */
    108   1.7  mrg 
    109   1.1  mrg /* rdtsc */
    110   1.1  mrg extern __inline unsigned long long
    111   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    112   1.1  mrg __rdtsc (void)
    113   1.1  mrg {
    114   1.1  mrg   return __builtin_ia32_rdtsc ();
    115   1.1  mrg }
    116   1.1  mrg 
    117   1.7  mrg #ifndef __iamcu__
    118   1.7  mrg 
    119   1.1  mrg /* rdtscp */
    120   1.1  mrg extern __inline unsigned long long
    121   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    122   1.1  mrg __rdtscp (unsigned int *__A)
    123   1.1  mrg {
    124   1.1  mrg   return __builtin_ia32_rdtscp (__A);
    125   1.1  mrg }
    126   1.1  mrg 
    127   1.7  mrg #endif /* __iamcu__ */
    128   1.7  mrg 
    129   1.1  mrg /* 8bit rol */
    130   1.1  mrg extern __inline unsigned char
    131   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    132   1.1  mrg __rolb (unsigned char __X, int __C)
    133   1.1  mrg {
    134   1.1  mrg   return __builtin_ia32_rolqi (__X, __C);
    135   1.1  mrg }
    136   1.1  mrg 
    137   1.1  mrg /* 16bit rol */
    138   1.1  mrg extern __inline unsigned short
    139   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    140   1.1  mrg __rolw (unsigned short __X, int __C)
    141   1.1  mrg {
    142   1.1  mrg   return __builtin_ia32_rolhi (__X, __C);
    143   1.1  mrg }
    144   1.1  mrg 
    145   1.1  mrg /* 32bit rol */
    146   1.1  mrg extern __inline unsigned int
    147   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    148   1.1  mrg __rold (unsigned int __X, int __C)
    149   1.1  mrg {
    150  1.10  mrg   __C &= 31;
    151  1.10  mrg   return (__X << __C) | (__X >> (-__C & 31));
    152   1.1  mrg }
    153   1.1  mrg 
    154   1.1  mrg /* 8bit ror */
    155   1.1  mrg extern __inline unsigned char
    156   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    157   1.1  mrg __rorb (unsigned char __X, int __C)
    158   1.1  mrg {
    159   1.1  mrg   return __builtin_ia32_rorqi (__X, __C);
    160   1.1  mrg }
    161   1.1  mrg 
    162   1.1  mrg /* 16bit ror */
    163   1.1  mrg extern __inline unsigned short
    164   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    165   1.1  mrg __rorw (unsigned short __X, int __C)
    166   1.1  mrg {
    167   1.1  mrg   return __builtin_ia32_rorhi (__X, __C);
    168   1.1  mrg }
    169   1.1  mrg 
    170   1.1  mrg /* 32bit ror */
    171   1.1  mrg extern __inline unsigned int
    172   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    173   1.1  mrg __rord (unsigned int __X, int __C)
    174   1.1  mrg {
    175  1.10  mrg   __C &= 31;
    176  1.10  mrg   return (__X >> __C) | (__X << (-__C & 31));
    177   1.1  mrg }
    178   1.1  mrg 
    179   1.3  mrg /* Pause */
    180   1.3  mrg extern __inline void
    181   1.3  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    182   1.3  mrg __pause (void)
    183   1.3  mrg {
    184   1.3  mrg   __builtin_ia32_pause ();
    185   1.3  mrg }
    186   1.3  mrg 
    187   1.1  mrg #ifdef __x86_64__
    188   1.1  mrg /* 64bit bsf */
    189   1.1  mrg extern __inline int
    190   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    191   1.1  mrg __bsfq (long long __X)
    192   1.1  mrg {
    193   1.1  mrg   return __builtin_ctzll (__X);
    194   1.1  mrg }
    195   1.1  mrg 
    196   1.1  mrg /* 64bit bsr */
    197   1.1  mrg extern __inline int
    198   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    199   1.1  mrg __bsrq (long long __X)
    200   1.1  mrg {
    201   1.1  mrg   return __builtin_ia32_bsrdi (__X);
    202   1.1  mrg }
    203   1.1  mrg 
    204   1.1  mrg /* 64bit bswap */
    205   1.1  mrg extern __inline long long
    206   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    207   1.1  mrg __bswapq (long long __X)
    208   1.1  mrg {
    209   1.1  mrg   return __builtin_bswap64 (__X);
    210   1.1  mrg }
    211   1.1  mrg 
    212   1.5  mrg #ifndef __SSE4_2__
    213   1.5  mrg #pragma GCC push_options
    214   1.5  mrg #pragma GCC target("sse4.2")
    215   1.5  mrg #define __DISABLE_SSE4_2__
    216   1.5  mrg #endif /* __SSE4_2__ */
    217   1.5  mrg 
    218   1.1  mrg /* 64bit accumulate CRC32 (polynomial 0x11EDC6F41) value.  */
    219   1.1  mrg extern __inline unsigned long long
    220   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    221   1.1  mrg __crc32q (unsigned long long __C, unsigned long long __V)
    222   1.1  mrg {
    223   1.1  mrg   return __builtin_ia32_crc32di (__C, __V);
    224   1.1  mrg }
    225   1.5  mrg 
    226   1.5  mrg #ifdef __DISABLE_SSE4_2__
    227   1.5  mrg #undef __DISABLE_SSE4_2__
    228   1.5  mrg #pragma GCC pop_options
    229   1.5  mrg #endif /* __DISABLE_SSE4_2__ */
    230   1.1  mrg 
    231   1.1  mrg /* 64bit popcnt */
    232   1.1  mrg extern __inline long long
    233   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    234   1.1  mrg __popcntq (unsigned long long __X)
    235   1.1  mrg {
    236   1.1  mrg   return __builtin_popcountll (__X);
    237   1.1  mrg }
    238   1.1  mrg 
    239   1.1  mrg /* 64bit rol */
    240   1.1  mrg extern __inline unsigned long long
    241   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    242   1.1  mrg __rolq (unsigned long long __X, int __C)
    243   1.1  mrg {
    244  1.10  mrg   __C &= 63;
    245  1.10  mrg   return (__X << __C) | (__X >> (-__C & 63));
    246   1.1  mrg }
    247   1.1  mrg 
    248   1.1  mrg /* 64bit ror */
    249   1.1  mrg extern __inline unsigned long long
    250   1.1  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    251   1.1  mrg __rorq (unsigned long long __X, int __C)
    252   1.1  mrg {
    253  1.10  mrg   __C &= 63;
    254  1.10  mrg   return (__X >> __C) | (__X << (-__C & 63));
    255   1.1  mrg }
    256   1.1  mrg 
    257   1.5  mrg /* Read flags register */
    258   1.5  mrg extern __inline unsigned long long
    259   1.5  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    260   1.5  mrg __readeflags (void)
    261   1.5  mrg {
    262   1.5  mrg   return __builtin_ia32_readeflags_u64 ();
    263   1.5  mrg }
    264   1.5  mrg 
    265   1.5  mrg /* Write flags register */
    266   1.5  mrg extern __inline void
    267   1.5  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    268   1.6  mrg __writeeflags (unsigned long long __X)
    269   1.5  mrg {
    270   1.6  mrg   __builtin_ia32_writeeflags_u64 (__X);
    271   1.5  mrg }
    272   1.5  mrg 
    273   1.1  mrg #define _bswap64(a)		__bswapq(a)
    274   1.1  mrg #define _popcnt64(a)		__popcntq(a)
    275   1.5  mrg #else
    276   1.5  mrg 
    277   1.5  mrg /* Read flags register */
    278   1.5  mrg extern __inline unsigned int
    279   1.5  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    280   1.5  mrg __readeflags (void)
    281   1.5  mrg {
    282   1.5  mrg   return __builtin_ia32_readeflags_u32 ();
    283   1.5  mrg }
    284   1.5  mrg 
    285   1.5  mrg /* Write flags register */
    286   1.5  mrg extern __inline void
    287   1.5  mrg __attribute__((__gnu_inline__, __always_inline__, __artificial__))
    288   1.6  mrg __writeeflags (unsigned int __X)
    289   1.5  mrg {
    290   1.6  mrg   __builtin_ia32_writeeflags_u32 (__X);
    291   1.5  mrg }
    292   1.5  mrg 
    293   1.5  mrg #endif
    294   1.5  mrg 
    295   1.5  mrg /* On LP64 systems, longs are 64-bit.  Use the appropriate rotate
    296   1.5  mrg  * function.  */
    297   1.5  mrg #ifdef __LP64__
    298   1.1  mrg #define _lrotl(a,b)		__rolq((a), (b))
    299   1.1  mrg #define _lrotr(a,b)		__rorq((a), (b))
    300   1.1  mrg #else
    301   1.1  mrg #define _lrotl(a,b)		__rold((a), (b))
    302   1.1  mrg #define _lrotr(a,b)		__rord((a), (b))
    303   1.1  mrg #endif
    304   1.1  mrg 
    305   1.1  mrg #define _bit_scan_forward(a)	__bsfd(a)
    306   1.1  mrg #define _bit_scan_reverse(a)	__bsrd(a)
    307   1.1  mrg #define _bswap(a)		__bswapd(a)
    308   1.1  mrg #define _popcnt32(a)		__popcntd(a)
    309   1.7  mrg #ifndef __iamcu__
    310   1.1  mrg #define _rdpmc(a)		__rdpmc(a)
    311   1.7  mrg #define _rdtscp(a)		__rdtscp(a)
    312   1.7  mrg #endif /* __iamcu__ */
    313   1.1  mrg #define _rdtsc()		__rdtsc()
    314   1.1  mrg #define _rotwl(a,b)		__rolw((a), (b))
    315   1.1  mrg #define _rotwr(a,b)		__rorw((a), (b))
    316   1.1  mrg #define _rotl(a,b)		__rold((a), (b))
    317   1.1  mrg #define _rotr(a,b)		__rord((a), (b))
    318