Home | History | Annotate | Download | only in include
      1 /* Copyright (C) 2013-2014 Free Software Foundation, Inc.
      2 
      3    This file is part of GCC.
      4 
      5    GCC is free software; you can redistribute it and/or modify
      6    it under the terms of the GNU General Public License as published by
      7    the Free Software Foundation; either version 3, or (at your option)
      8    any later version.
      9 
     10    GCC is distributed in the hope that it will be useful,
     11    but WITHOUT ANY WARRANTY; without even the implied warranty of
     12    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     13    GNU General Public License for more details.
     14 
     15    Under Section 7 of GPL version 3, you are granted additional
     16    permissions described in the GCC Runtime Library Exception, version
     17    3.1, as published by the Free Software Foundation.
     18 
     19    You should have received a copy of the GNU General Public License and
     20    a copy of the GCC Runtime Library Exception along with this program;
     21    see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
     22    <http://www.gnu.org/licenses/>.  */
     23 
/* This header is meant to be pulled in by <immintrin.h> only; stop the
   build if it is included on its own.  */
#ifndef _IMMINTRIN_H_INCLUDED
#error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead."
#endif

/* Include guard; the matching #endif is the last directive in the file.  */
#ifndef _AVX512PFINTRIN_H_INCLUDED
#define _AVX512PFINTRIN_H_INCLUDED

/* If __AVX512PF__ is not already defined, save the current options, switch
   the target to "avx512pf" for the rest of this header, and record that in
   __DISABLE_AVX512PF__ so the end of the file knows to pop the options.  */
#ifndef __AVX512PF__
#pragma GCC push_options
#pragma GCC target("avx512pf")
#define __DISABLE_AVX512PF__
#endif /* __AVX512PF__ */
     36 
     37 /* Internal data types for implementing the intrinsics.  */
     38 typedef long long __v8di __attribute__ ((__vector_size__ (64)));
     39 typedef int __v16si __attribute__ ((__vector_size__ (64)));
     40 
     41 /* The Intel API is flexible enough that we must allow aliasing with other
     42    vector types, and their scalar components.  */
     43 typedef long long __m512i __attribute__ ((__vector_size__ (64), __may_alias__));
     44 
     45 typedef unsigned char  __mmask8;
     46 typedef unsigned short __mmask16;
     47 
     48 #ifdef __OPTIMIZE__
     49 extern __inline void
     50 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     51 _mm512_mask_prefetch_i32gather_pd (__m256i index, __mmask8 mask,
     52 				   void *addr, int scale, int hint)
     53 {
     54   __builtin_ia32_gatherpfdpd (mask, (__v8si) index, (long long const *) addr,
     55 			      scale, hint);
     56 }
     57 
     58 extern __inline void
     59 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     60 _mm512_mask_prefetch_i32gather_ps (__m512i index, __mmask16 mask,
     61 				   void *addr, int scale, int hint)
     62 {
     63   __builtin_ia32_gatherpfdps (mask, (__v16si) index, (int const *) addr,
     64 			      scale, hint);
     65 }
     66 
     67 extern __inline void
     68 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     69 _mm512_mask_prefetch_i64gather_pd (__m512i index, __mmask8 mask,
     70 				   void *addr, int scale, int hint)
     71 {
     72   __builtin_ia32_gatherpfqpd (mask, (__v8di) index, (long long const *) addr,
     73 			      scale, hint);
     74 }
     75 
     76 extern __inline void
     77 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     78 _mm512_mask_prefetch_i64gather_ps (__m512i index, __mmask8 mask,
     79 				   void *addr, int scale, int hint)
     80 {
     81   __builtin_ia32_gatherpfqps (mask, (__v8di) index, (int const *) addr,
     82 			      scale, hint);
     83 }
     84 
     85 extern __inline void
     86 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     87 _mm512_prefetch_i32scatter_pd (void *addr, __m256i index, int scale,
     88 			       int hint)
     89 {
     90   __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) index,
     91 			       (long long const *)addr, scale, hint);
     92 }
     93 
     94 extern __inline void
     95 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
     96 _mm512_prefetch_i32scatter_ps (void *addr, __m512i index, int scale,
     97 			       int hint)
     98 {
     99   __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) index, (int const *) addr,
    100 			       scale, hint);
    101 }
    102 
    103 extern __inline void
    104 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    105 _mm512_mask_prefetch_i32scatter_pd (void *addr, __mmask8 mask,
    106 				    __m256i index, int scale, int hint)
    107 {
    108   __builtin_ia32_scatterpfdpd (mask, (__v8si) index, (long long const *) addr,
    109 			       scale, hint);
    110 }
    111 
    112 extern __inline void
    113 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    114 _mm512_mask_prefetch_i32scatter_ps (void *addr, __mmask16 mask,
    115 				    __m512i index, int scale, int hint)
    116 {
    117   __builtin_ia32_scatterpfdps (mask, (__v16si) index, (int const *) addr,
    118 			       scale, hint);
    119 }
    120 
    121 extern __inline void
    122 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    123 _mm512_prefetch_i64scatter_pd (void *addr, __m512i index, int scale,
    124 			       int hint)
    125 {
    126   __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) index, (long long const *) addr,
    127 			       scale, hint);
    128 }
    129 
    130 extern __inline void
    131 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    132 _mm512_prefetch_i64scatter_ps (void *addr, __m512i index, int scale,
    133 			       int hint)
    134 {
    135   __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) index, (int const *) addr,
    136 			       scale, hint);
    137 }
    138 
    139 extern __inline void
    140 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    141 _mm512_mask_prefetch_i64scatter_pd (void *addr, __mmask16 mask,
    142 				    __m512i index, int scale, int hint)
    143 {
    144   __builtin_ia32_scatterpfqpd (mask, (__v8di) index, (long long const *) addr,
    145 			       scale, hint);
    146 }
    147 
    148 extern __inline void
    149 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
    150 _mm512_mask_prefetch_i64scatter_ps (void *addr, __mmask16 mask,
    151 				    __m512i index, int scale, int hint)
    152 {
    153   __builtin_ia32_scatterpfqps (mask, (__v8di) index, (int const *) addr,
    154 			       scale, hint);
    155 }
    156 
    157 #else
    158 #define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
    159   __builtin_ia32_gatherpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX,	     \
    160 			      (long long const *)ADDR, (int)SCALE, (int)HINT)
    161 
    162 #define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
    163   __builtin_ia32_gatherpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX,      \
    164 			      (int const *)ADDR, (int)SCALE, (int)HINT)
    165 
    166 #define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT)    \
    167   __builtin_ia32_gatherpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX,	     \
    168 			      (long long const *)ADDR, (int)SCALE, (int)HINT)
    169 
    170 #define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT)    \
    171   __builtin_ia32_gatherpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX,	     \
    172 			      (int const *)ADDR, (int)SCALE, (int)HINT)
    173 
    174 #define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT)              \
    175   __builtin_ia32_scatterpfdpd ((__mmask8)0xFF, (__v8si)(__m256i)INDEX,       \
    176 			       (long long const *)ADDR, (int)SCALE, (int)HINT)
    177 
    178 #define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT)              \
    179   __builtin_ia32_scatterpfdps ((__mmask16)0xFFFF, (__v16si)(__m512i)INDEX,   \
    180 			       (int const *)ADDR, (int)SCALE, (int)HINT)
    181 
    182 #define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
    183   __builtin_ia32_scatterpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX,       \
    184 			       (long long const *)ADDR, (int)SCALE, (int)HINT)
    185 
    186 #define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
    187   __builtin_ia32_scatterpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX,     \
    188 			       (int const *)ADDR, (int)SCALE, (int)HINT)
    189 
    190 #define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT)              \
    191   __builtin_ia32_scatterpfqpd ((__mmask8)0xFF, (__v8di)(__m512i)INDEX,	     \
    192 			       (long long const *)ADDR, (int)SCALE, (int)HINT)
    193 
    194 #define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT)              \
    195   __builtin_ia32_scatterpfqps ((__mmask8)0xFF, (__v8di)(__m512i)INDEX,	     \
    196 			       (int const *)ADDR, (int)SCALE, (int)HINT)
    197 
    198 #define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT)   \
    199   __builtin_ia32_scatterpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX,	     \
    200 			       (long long const *)ADDR, (int)SCALE, (int)HINT)
    201 
    202 #define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT)   \
    203   __builtin_ia32_scatterpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX,	     \
    204 			       (int const *)ADDR, (int)SCALE, (int)HINT)
    205 #endif
    206 
/* If the top of this header switched the target (signalled by
   __DISABLE_AVX512PF__), drop the marker and restore the options that were
   saved with push_options.  */
#ifdef __DISABLE_AVX512PF__
#undef __DISABLE_AVX512PF__
#pragma GCC pop_options
#endif /* __DISABLE_AVX512PF__ */

/* Closes the include guard opened near the top of the file.  */
#endif /* _AVX512PFINTRIN_H_INCLUDED */
    213