1 /* Copyright (C) 2013-2018 Free Software Foundation, Inc. 2 3 This file is part of GCC. 4 5 GCC is free software; you can redistribute it and/or modify 6 it under the terms of the GNU General Public License as published by 7 the Free Software Foundation; either version 3, or (at your option) 8 any later version. 9 10 GCC is distributed in the hope that it will be useful, 11 but WITHOUT ANY WARRANTY; without even the implied warranty of 12 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 13 GNU General Public License for more details. 14 15 Under Section 7 of GPL version 3, you are granted additional 16 permissions described in the GCC Runtime Library Exception, version 17 3.1, as published by the Free Software Foundation. 18 19 You should have received a copy of the GNU General Public License and 20 a copy of the GCC Runtime Library Exception along with this program; 21 see the files COPYING3 and COPYING.RUNTIME respectively. If not, see 22 <http://www.gnu.org/licenses/>. */ 23 24 #ifndef _IMMINTRIN_H_INCLUDED 25 #error "Never use <avx512pfintrin.h> directly; include <immintrin.h> instead." 26 #endif 27 28 #ifndef _AVX512PFINTRIN_H_INCLUDED 29 #define _AVX512PFINTRIN_H_INCLUDED 30 31 #ifndef __AVX512PF__ 32 #pragma GCC push_options 33 #pragma GCC target("avx512pf") 34 #define __DISABLE_AVX512PF__ 35 #endif /* __AVX512PF__ */ 36 37 /* Internal data types for implementing the intrinsics. */ 38 typedef long long __v8di __attribute__ ((__vector_size__ (64))); 39 typedef int __v16si __attribute__ ((__vector_size__ (64))); 40 41 /* The Intel API is flexible enough that we must allow aliasing with other 42 vector types, and their scalar components. */ 43 typedef long long __m512i __attribute__ ((__vector_size__ (64), __may_alias__)); 44 45 typedef unsigned char __mmask8; 46 typedef unsigned short __mmask16; 47 48 #ifdef __OPTIMIZE__ 49 extern __inline void 50 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 51 _mm512_prefetch_i32gather_pd (__m256i __index, void const *__addr, 52 int __scale, int __hint) 53 { 54 __builtin_ia32_gatherpfdpd ((__mmask8) 0xFF, (__v8si) __index, __addr, 55 __scale, __hint); 56 } 57 58 extern __inline void 59 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 60 _mm512_prefetch_i32gather_ps (__m512i __index, void const *__addr, 61 int __scale, int __hint) 62 { 63 __builtin_ia32_gatherpfdps ((__mmask16) 0xFFFF, (__v16si) __index, __addr, 64 __scale, __hint); 65 } 66 67 extern __inline void 68 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 69 _mm512_mask_prefetch_i32gather_pd (__m256i __index, __mmask8 __mask, 70 void const *__addr, int __scale, int __hint) 71 { 72 __builtin_ia32_gatherpfdpd (__mask, (__v8si) __index, __addr, __scale, 73 __hint); 74 } 75 76 extern __inline void 77 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 78 _mm512_mask_prefetch_i32gather_ps (__m512i __index, __mmask16 __mask, 79 void const *__addr, int __scale, int __hint) 80 { 81 __builtin_ia32_gatherpfdps (__mask, (__v16si) __index, __addr, __scale, 82 __hint); 83 } 84 85 extern __inline void 86 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 87 _mm512_prefetch_i64gather_pd (__m512i __index, void const *__addr, 88 int __scale, int __hint) 89 { 90 __builtin_ia32_gatherpfqpd ((__mmask8) 0xFF, (__v8di) __index, __addr, 91 __scale, __hint); 92 } 93 94 extern __inline void 95 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 96 _mm512_prefetch_i64gather_ps (__m512i __index, void const *__addr, 97 int __scale, int __hint) 98 { 99 __builtin_ia32_gatherpfqps ((__mmask8) 0xFF, (__v8di) __index, __addr, 100 __scale, __hint); 101 } 102 103 extern __inline void 104 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 105 _mm512_mask_prefetch_i64gather_pd (__m512i __index, __mmask8 __mask, 106 void const *__addr, int __scale, int __hint) 107 { 108 __builtin_ia32_gatherpfqpd (__mask, (__v8di) __index, __addr, __scale, 109 __hint); 110 } 111 112 extern __inline void 113 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 114 _mm512_mask_prefetch_i64gather_ps (__m512i __index, __mmask8 __mask, 115 void const *__addr, int __scale, int __hint) 116 { 117 __builtin_ia32_gatherpfqps (__mask, (__v8di) __index, __addr, __scale, 118 __hint); 119 } 120 121 extern __inline void 122 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 123 _mm512_prefetch_i32scatter_pd (void *__addr, __m256i __index, int __scale, 124 int __hint) 125 { 126 __builtin_ia32_scatterpfdpd ((__mmask8) 0xFF, (__v8si) __index, __addr, 127 __scale, __hint); 128 } 129 130 extern __inline void 131 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 132 _mm512_prefetch_i32scatter_ps (void *__addr, __m512i __index, int __scale, 133 int __hint) 134 { 135 __builtin_ia32_scatterpfdps ((__mmask16) 0xFFFF, (__v16si) __index, __addr, 136 __scale, __hint); 137 } 138 139 extern __inline void 140 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 141 _mm512_mask_prefetch_i32scatter_pd (void *__addr, __mmask8 __mask, 142 __m256i __index, int __scale, int __hint) 143 { 144 __builtin_ia32_scatterpfdpd (__mask, (__v8si) __index, __addr, __scale, 145 __hint); 146 } 147 148 extern __inline void 149 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 150 _mm512_mask_prefetch_i32scatter_ps (void *__addr, __mmask16 __mask, 151 __m512i __index, int __scale, int __hint) 152 { 153 __builtin_ia32_scatterpfdps (__mask, (__v16si) __index, __addr, __scale, 154 __hint); 155 } 156 157 extern __inline void 158 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 159 _mm512_prefetch_i64scatter_pd (void *__addr, __m512i __index, int __scale, 160 int __hint) 161 { 162 __builtin_ia32_scatterpfqpd ((__mmask8) 0xFF, (__v8di) __index,__addr, 163 __scale, __hint); 164 } 165 166 extern __inline void 167 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 168 _mm512_prefetch_i64scatter_ps (void *__addr, __m512i __index, int __scale, 169 int __hint) 170 { 171 __builtin_ia32_scatterpfqps ((__mmask8) 0xFF, (__v8di) __index, __addr, 172 __scale, __hint); 173 } 174 175 extern __inline void 176 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 177 _mm512_mask_prefetch_i64scatter_pd (void *__addr, __mmask16 __mask, 178 __m512i __index, int __scale, int __hint) 179 { 180 __builtin_ia32_scatterpfqpd (__mask, (__v8di) __index, __addr, __scale, 181 __hint); 182 } 183 184 extern __inline void 185 __attribute__ ((__gnu_inline__, __always_inline__, __artificial__)) 186 _mm512_mask_prefetch_i64scatter_ps (void *__addr, __mmask16 __mask, 187 __m512i __index, int __scale, int __hint) 188 { 189 __builtin_ia32_scatterpfqps (__mask, (__v8di) __index, __addr, __scale, 190 __hint); 191 } 192 193 #else 194 #define _mm512_prefetch_i32gather_pd(INDEX, ADDR, SCALE, HINT) \ 195 __builtin_ia32_gatherpfdpd ((__mmask8)0xFF, (__v8si)(__m256i)INDEX, \ 196 (void const *)ADDR, (int)SCALE, (int)HINT) 197 198 #define _mm512_prefetch_i32gather_ps(INDEX, ADDR, SCALE, HINT) \ 199 __builtin_ia32_gatherpfdps ((__mmask16)0xFFFF, (__v16si)(__m512i)INDEX, \ 200 (void const *)ADDR, (int)SCALE, (int)HINT) 201 202 #define _mm512_mask_prefetch_i32gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \ 203 __builtin_ia32_gatherpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX, \ 204 (void const *)ADDR, (int)SCALE, (int)HINT) 205 206 #define _mm512_mask_prefetch_i32gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \ 207 __builtin_ia32_gatherpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX, \ 208 (void const *)ADDR, (int)SCALE, (int)HINT) 209 210 #define _mm512_prefetch_i64gather_pd(INDEX, ADDR, SCALE, HINT) \ 211 __builtin_ia32_gatherpfqpd ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \ 212 (void *)ADDR, (int)SCALE, (int)HINT) 213 214 #define _mm512_prefetch_i64gather_ps(INDEX, ADDR, SCALE, HINT) \ 215 __builtin_ia32_gatherpfqps ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \ 216 (void *)ADDR, (int)SCALE, (int)HINT) 217 218 #define _mm512_mask_prefetch_i64gather_pd(INDEX, MASK, ADDR, SCALE, HINT) \ 219 __builtin_ia32_gatherpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \ 220 (void *)ADDR, (int)SCALE, (int)HINT) 221 222 #define _mm512_mask_prefetch_i64gather_ps(INDEX, MASK, ADDR, SCALE, HINT) \ 223 __builtin_ia32_gatherpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \ 224 (void *)ADDR, (int)SCALE, (int)HINT) 225 226 #define _mm512_prefetch_i32scatter_pd(ADDR, INDEX, SCALE, HINT) \ 227 __builtin_ia32_scatterpfdpd ((__mmask8)0xFF, (__v8si)(__m256i)INDEX, \ 228 (void *)ADDR, (int)SCALE, (int)HINT) 229 230 #define _mm512_prefetch_i32scatter_ps(ADDR, INDEX, SCALE, HINT) \ 231 __builtin_ia32_scatterpfdps ((__mmask16)0xFFFF, (__v16si)(__m512i)INDEX, \ 232 (void *)ADDR, (int)SCALE, (int)HINT) 233 234 #define _mm512_mask_prefetch_i32scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \ 235 __builtin_ia32_scatterpfdpd ((__mmask8)MASK, (__v8si)(__m256i)INDEX, \ 236 (void *)ADDR, (int)SCALE, (int)HINT) 237 238 #define _mm512_mask_prefetch_i32scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \ 239 __builtin_ia32_scatterpfdps ((__mmask16)MASK, (__v16si)(__m512i)INDEX, \ 240 (void *)ADDR, (int)SCALE, (int)HINT) 241 242 #define _mm512_prefetch_i64scatter_pd(ADDR, INDEX, SCALE, HINT) \ 243 __builtin_ia32_scatterpfqpd ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \ 244 (void *)ADDR, (int)SCALE, (int)HINT) 245 246 #define _mm512_prefetch_i64scatter_ps(ADDR, INDEX, SCALE, HINT) \ 247 __builtin_ia32_scatterpfqps ((__mmask8)0xFF, (__v8di)(__m512i)INDEX, \ 248 (void *)ADDR, (int)SCALE, (int)HINT) 249 250 #define _mm512_mask_prefetch_i64scatter_pd(ADDR, MASK, INDEX, SCALE, HINT) \ 251 __builtin_ia32_scatterpfqpd ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \ 252 (void *)ADDR, (int)SCALE, (int)HINT) 253 254 #define _mm512_mask_prefetch_i64scatter_ps(ADDR, MASK, INDEX, SCALE, HINT) \ 255 __builtin_ia32_scatterpfqps ((__mmask8)MASK, (__v8di)(__m512i)INDEX, \ 256 (void *)ADDR, (int)SCALE, (int)HINT) 257 #endif 258 259 #ifdef __DISABLE_AVX512PF__ 260 #undef __DISABLE_AVX512PF__ 261 #pragma GCC pop_options 262 #endif /* __DISABLE_AVX512PF__ */ 263 264 #endif /* _AVX512PFINTRIN_H_INCLUDED */ 265