CBMC
gcc_builtin_headers_ia32-6.h
Go to the documentation of this file.
1 // clang-format off
2 // amx-fp16
3 void __builtin_ia32_tdpfp16ps(unsigned char, unsigned char, unsigned char);
4 __gcc_v256si __builtin_ia32_tdpfp16ps_internal(unsigned short, unsigned short, unsigned short, __gcc_v256si, __gcc_v256si, __gcc_v256si);
5 // avx
6 short __builtin_ia32_vec_ext_v16hi(__gcc_v16hi, int);
7 char __builtin_ia32_vec_ext_v32qi(__gcc_v32qi, int);
8 long long int __builtin_ia32_vec_ext_v4di(__gcc_v4di, int);
9 int __builtin_ia32_vec_ext_v8si(__gcc_v8si, int);
10 __gcc_v16hi __builtin_ia32_vec_set_v16hi(__gcc_v16hi, short, int);
11 __gcc_v32qi __builtin_ia32_vec_set_v32qi(__gcc_v32qi, char, int);
12 __gcc_v4di __builtin_ia32_vec_set_v4di(__gcc_v4di, long long int, int);
13 __gcc_v8si __builtin_ia32_vec_set_v8si(__gcc_v8si, int, int);
14 // avx2
15 __gcc_v4si __builtin_ia32_gatherd_d(__gcc_v4si, const int *, __gcc_v4si, __gcc_v4si, char);
16 __gcc_v8si __builtin_ia32_gatherd_d256(__gcc_v8si, const int *, __gcc_v8si, __gcc_v8si, char);
17 __gcc_v2df __builtin_ia32_gatherd_pd(__gcc_v2df, const double *, __gcc_v4si, __gcc_v2df, char);
18 __gcc_v4df __builtin_ia32_gatherd_pd256(__gcc_v4df, const double *, __gcc_v4si, __gcc_v4df, char);
19 __gcc_v4sf __builtin_ia32_gatherd_ps(__gcc_v4sf, const float *, __gcc_v4si, __gcc_v4sf, char);
20 __gcc_v8sf __builtin_ia32_gatherd_ps256(__gcc_v8sf, const float *, __gcc_v8si, __gcc_v8sf, char);
21 __gcc_v2di __builtin_ia32_gatherd_q(__gcc_v2di, const long long int *, __gcc_v4si, __gcc_v2di, char);
22 __gcc_v4di __builtin_ia32_gatherd_q256(__gcc_v4di, const long long int *, __gcc_v4si, __gcc_v4di, char);
23 __gcc_v4si __builtin_ia32_gatherq_d(__gcc_v4si, const int *, __gcc_v2di, __gcc_v4si, char);
24 __gcc_v4si __builtin_ia32_gatherq_d256(__gcc_v4si, const int *, __gcc_v4di, __gcc_v4si, char);
25 __gcc_v2df __builtin_ia32_gatherq_pd(__gcc_v2df, const double *, __gcc_v2di, __gcc_v2df, char);
26 __gcc_v4df __builtin_ia32_gatherq_pd256(__gcc_v4df, const double *, __gcc_v4di, __gcc_v4df, char);
27 __gcc_v4sf __builtin_ia32_gatherq_ps(__gcc_v4sf, const float *, __gcc_v2di, __gcc_v4sf, char);
28 __gcc_v4sf __builtin_ia32_gatherq_ps256(__gcc_v4sf, const float *, __gcc_v4di, __gcc_v4sf, char);
29 __gcc_v2di __builtin_ia32_gatherq_q(__gcc_v2di, const long long int *, __gcc_v2di, __gcc_v2di, char);
30 __gcc_v4di __builtin_ia32_gatherq_q256(__gcc_v4di, const long long int *, __gcc_v4di, __gcc_v4di, char);
31 __gcc_v4di __builtin_ia32_pslldqi256_byteshift(__gcc_v4di, int);
32 __gcc_v4di __builtin_ia32_psrldqi256_byteshift(__gcc_v4di, int);
33 // avx512bf16
34 __gcc_v32hf __builtin_ia32_selectpbf_512(unsigned int, __gcc_v32hf, __gcc_v32hf);
35 __gcc_v8hf __builtin_ia32_selectsbf_128(unsigned char, __gcc_v8hf, __gcc_v8hf);
36 // avx512bf16,avx512vl
37 __gcc_v8hf __builtin_ia32_selectpbf_128(unsigned char, __gcc_v8hf, __gcc_v8hf);
38 __gcc_v16hf __builtin_ia32_selectpbf_256(unsigned short, __gcc_v16hf, __gcc_v16hf);
39 // avx512bf16,avx512vl|avxneconvert
40 __gcc_v8hf __builtin_ia32_vcvtneps2bf16128(__gcc_v4sf);
41 __gcc_v8hf __builtin_ia32_vcvtneps2bf16256(__gcc_v8sf);
42 // avx512bitalg
43 __gcc_v64qi __builtin_ia32_vpopcntb_512(__gcc_v64qi);
44 __gcc_v32hi __builtin_ia32_vpopcntw_512(__gcc_v32hi);
45 // avx512bw
46 __gcc_v32hi __builtin_ia32_dbpsadbw512(__gcc_v64qi, __gcc_v64qi, int);
47 __gcc_v32hi __builtin_ia32_packssdw512(__gcc_v16si, __gcc_v16si);
48 __gcc_v64qi __builtin_ia32_packsswb512(__gcc_v32hi, __gcc_v32hi);
49 __gcc_v32hi __builtin_ia32_packusdw512(__gcc_v16si, __gcc_v16si);
50 __gcc_v64qi __builtin_ia32_packuswb512(__gcc_v32hi, __gcc_v32hi);
51 __gcc_v64qi __builtin_ia32_pavgb512(__gcc_v64qi, __gcc_v64qi);
52 __gcc_v32hi __builtin_ia32_pavgw512(__gcc_v32hi, __gcc_v32hi);
53 __gcc_v32hi __builtin_ia32_permvarhi512(__gcc_v32hi, __gcc_v32hi);
54 __gcc_v32hi __builtin_ia32_pmaddubsw512(__gcc_v64qi, __gcc_v64qi);
55 __gcc_v16si __builtin_ia32_pmaddwd512(__gcc_v32hi, __gcc_v32hi);
56 __gcc_v32hi __builtin_ia32_pmulhrsw512(__gcc_v32hi, __gcc_v32hi);
57 __gcc_v32hi __builtin_ia32_pmulhuw512(__gcc_v32hi, __gcc_v32hi);
58 __gcc_v32hi __builtin_ia32_pmulhw512(__gcc_v32hi, __gcc_v32hi);
59 __gcc_v64qi __builtin_ia32_pshufb512(__gcc_v64qi, __gcc_v64qi);
60 __gcc_v32hi __builtin_ia32_pshufhw512(__gcc_v32hi, int);
61 __gcc_v32hi __builtin_ia32_pshuflw512(__gcc_v32hi, int);
62 __gcc_v8di __builtin_ia32_pslldqi512_byteshift(__gcc_v8di, int);
63 __gcc_v32hi __builtin_ia32_psllv32hi(__gcc_v32hi, __gcc_v32hi);
64 __gcc_v32hi __builtin_ia32_psllw512(__gcc_v32hi, __gcc_v8hi);
65 __gcc_v32hi __builtin_ia32_psllwi512(__gcc_v32hi, int);
66 __gcc_v32hi __builtin_ia32_psrav32hi(__gcc_v32hi, __gcc_v32hi);
67 __gcc_v32hi __builtin_ia32_psraw512(__gcc_v32hi, __gcc_v8hi);
68 __gcc_v32hi __builtin_ia32_psrawi512(__gcc_v32hi, int);
69 __gcc_v8di __builtin_ia32_psrldqi512_byteshift(__gcc_v8di, int);
70 __gcc_v32hi __builtin_ia32_psrlv32hi(__gcc_v32hi, __gcc_v32hi);
71 __gcc_v32hi __builtin_ia32_psrlw512(__gcc_v32hi, __gcc_v8hi);
72 __gcc_v32hi __builtin_ia32_psrlwi512(__gcc_v32hi, int);
73 __gcc_v32hi __builtin_ia32_vpermi2varhi512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi);
74 // avx512bw,avx512vl
75 __gcc_v8hi __builtin_ia32_dbpsadbw128(__gcc_v16qi, __gcc_v16qi, int);
76 __gcc_v16hi __builtin_ia32_dbpsadbw256(__gcc_v32qi, __gcc_v32qi, int);
77 __gcc_v8hi __builtin_ia32_permvarhi128(__gcc_v8hi, __gcc_v8hi);
78 __gcc_v16hi __builtin_ia32_permvarhi256(__gcc_v16hi, __gcc_v16hi);
79 __gcc_v16hi __builtin_ia32_psllv16hi(__gcc_v16hi, __gcc_v16hi);
80 __gcc_v8hi __builtin_ia32_psllv8hi(__gcc_v8hi, __gcc_v8hi);
81 __gcc_v16hi __builtin_ia32_psrav16hi(__gcc_v16hi, __gcc_v16hi);
82 __gcc_v8hi __builtin_ia32_psrav8hi(__gcc_v8hi, __gcc_v8hi);
83 __gcc_v16hi __builtin_ia32_psrlv16hi(__gcc_v16hi, __gcc_v16hi);
84 __gcc_v8hi __builtin_ia32_psrlv8hi(__gcc_v8hi, __gcc_v8hi);
85 // avx512cd
86 __gcc_v8di __builtin_ia32_vpconflictdi_512(__gcc_v8di);
87 __gcc_v16si __builtin_ia32_vpconflictsi_512(__gcc_v16si);
88 __gcc_v16si __builtin_ia32_vplzcntd_512(__gcc_v16si);
89 __gcc_v8di __builtin_ia32_vplzcntq_512(__gcc_v8di);
90 // avx512cd,avx512vl
91 __gcc_v2di __builtin_ia32_vpconflictdi_128(__gcc_v2di);
92 __gcc_v4di __builtin_ia32_vpconflictdi_256(__gcc_v4di);
93 __gcc_v4si __builtin_ia32_vpconflictsi_128(__gcc_v4si);
94 __gcc_v8si __builtin_ia32_vpconflictsi_256(__gcc_v8si);
95 __gcc_v4si __builtin_ia32_vplzcntd_128(__gcc_v4si);
96 __gcc_v8si __builtin_ia32_vplzcntd_256(__gcc_v8si);
97 __gcc_v2di __builtin_ia32_vplzcntq_128(__gcc_v2di);
98 __gcc_v4di __builtin_ia32_vplzcntq_256(__gcc_v4di);
99 // avx512dq
100 __gcc_v16sf __builtin_ia32_insertf32x8(__gcc_v16sf, __gcc_v8sf, int);
101 __gcc_v8df __builtin_ia32_insertf64x2_512(__gcc_v8df, __gcc_v2df, int);
102 __gcc_v16si __builtin_ia32_inserti32x8(__gcc_v16si, __gcc_v8si, int);
103 __gcc_v8di __builtin_ia32_inserti64x2_512(__gcc_v8di, __gcc_v2di, int);
104 __gcc_v2df __builtin_ia32_rangesd128_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int, int);
105 __gcc_v4sf __builtin_ia32_rangess128_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int, int);
106 // avx512dq,avx512vl
107 __gcc_v4df __builtin_ia32_insertf64x2_256(__gcc_v4df, __gcc_v2df, int);
108 __gcc_v4di __builtin_ia32_inserti64x2_256(__gcc_v4di, __gcc_v2di, int);
109 // avx512er
110 __gcc_v2df __builtin_ia32_rcp28sd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
111 __gcc_v4sf __builtin_ia32_rcp28ss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
112 __gcc_v2df __builtin_ia32_rsqrt28sd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
113 __gcc_v4sf __builtin_ia32_rsqrt28ss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
114 // avx512f
115 __gcc_v8df __builtin_ia32_addpd512(__gcc_v8df, __gcc_v8df, int);
116 __gcc_v16sf __builtin_ia32_addps512(__gcc_v16sf, __gcc_v16sf, int);
117 __gcc_v2df __builtin_ia32_addsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
118 __gcc_v4sf __builtin_ia32_addss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
119 __gcc_v16si __builtin_ia32_alignd512(__gcc_v16si, __gcc_v16si, int);
120 __gcc_v8di __builtin_ia32_alignq512(__gcc_v8di, __gcc_v8di, int);
121 __gcc_v8df __builtin_ia32_divpd512(__gcc_v8df, __gcc_v8df, int);
122 __gcc_v16sf __builtin_ia32_divps512(__gcc_v16sf, __gcc_v16sf, int);
123 __gcc_v2df __builtin_ia32_divsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
124 __gcc_v4sf __builtin_ia32_divss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
125 __gcc_v2df __builtin_ia32_getexpsd128_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
126 __gcc_v4sf __builtin_ia32_getexpss128_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
127 __gcc_v2df __builtin_ia32_getmantsd_round_mask(__gcc_v2df, __gcc_v2df, int, __gcc_v2df, unsigned char, int);
128 __gcc_v4sf __builtin_ia32_getmantss_round_mask(__gcc_v4sf, __gcc_v4sf, int, __gcc_v4sf, unsigned char, int);
129 __gcc_v16sf __builtin_ia32_insertf32x4(__gcc_v16sf, __gcc_v4sf, int);
130 __gcc_v8df __builtin_ia32_insertf64x4(__gcc_v8df, __gcc_v4df, int);
131 __gcc_v16si __builtin_ia32_inserti32x4(__gcc_v16si, __gcc_v4si, int);
132 __gcc_v8di __builtin_ia32_inserti64x4(__gcc_v8di, __gcc_v4di, int);
133 __gcc_v2df __builtin_ia32_loadsd128_mask(const __gcc_v2df *, __gcc_v2df, unsigned char);
134 __gcc_v4sf __builtin_ia32_loadss128_mask(const __gcc_v4sf *, __gcc_v4sf, unsigned char);
135 __gcc_v8df __builtin_ia32_maxpd512(__gcc_v8df, __gcc_v8df, int);
136 __gcc_v16sf __builtin_ia32_maxps512(__gcc_v16sf, __gcc_v16sf, int);
137 __gcc_v2df __builtin_ia32_maxsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
138 __gcc_v4sf __builtin_ia32_maxss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
139 __gcc_v8df __builtin_ia32_minpd512(__gcc_v8df, __gcc_v8df, int);
140 __gcc_v16sf __builtin_ia32_minps512(__gcc_v16sf, __gcc_v16sf, int);
141 __gcc_v2df __builtin_ia32_minsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
142 __gcc_v4sf __builtin_ia32_minss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
143 __gcc_v8df __builtin_ia32_mulpd512(__gcc_v8df, __gcc_v8df, int);
144 __gcc_v16sf __builtin_ia32_mulps512(__gcc_v16sf, __gcc_v16sf, int);
145 __gcc_v2df __builtin_ia32_mulsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
146 __gcc_v4sf __builtin_ia32_mulss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
147 __gcc_v8df __builtin_ia32_permdf512(__gcc_v8df, int);
148 __gcc_v8di __builtin_ia32_permdi512(__gcc_v8di, int);
149 __gcc_v8df __builtin_ia32_permvardf512(__gcc_v8df, __gcc_v8di);
150 __gcc_v8di __builtin_ia32_permvardi512(__gcc_v8di, __gcc_v8di);
151 __gcc_v16sf __builtin_ia32_permvarsf512(__gcc_v16sf, __gcc_v16si);
152 __gcc_v16si __builtin_ia32_permvarsi512(__gcc_v16si, __gcc_v16si);
153 __gcc_v8di __builtin_ia32_pmuldq512(__gcc_v16si, __gcc_v16si);
154 __gcc_v8di __builtin_ia32_pmuludq512(__gcc_v16si, __gcc_v16si);
155 __gcc_v16si __builtin_ia32_prold512(__gcc_v16si, int);
156 __gcc_v8di __builtin_ia32_prolq512(__gcc_v8di, int);
157 __gcc_v16si __builtin_ia32_prolvd512(__gcc_v16si, __gcc_v16si);
158 __gcc_v8di __builtin_ia32_prolvq512(__gcc_v8di, __gcc_v8di);
159 __gcc_v16si __builtin_ia32_prord512(__gcc_v16si, int);
160 __gcc_v8di __builtin_ia32_prorq512(__gcc_v8di, int);
161 __gcc_v16si __builtin_ia32_prorvd512(__gcc_v16si, __gcc_v16si);
162 __gcc_v8di __builtin_ia32_prorvq512(__gcc_v8di, __gcc_v8di);
163 __gcc_v16si __builtin_ia32_pshufd512(__gcc_v16si, int);
164 __gcc_v16si __builtin_ia32_pslld512(__gcc_v16si, __gcc_v4si);
165 __gcc_v16si __builtin_ia32_pslldi512(__gcc_v16si, int);
166 __gcc_v8di __builtin_ia32_psllq512(__gcc_v8di, __gcc_v2di);
167 __gcc_v8di __builtin_ia32_psllqi512(__gcc_v8di, int);
168 __gcc_v16si __builtin_ia32_psllv16si(__gcc_v16si, __gcc_v16si);
169 __gcc_v8di __builtin_ia32_psllv8di(__gcc_v8di, __gcc_v8di);
170 __gcc_v16si __builtin_ia32_psrad512(__gcc_v16si, __gcc_v4si);
171 __gcc_v16si __builtin_ia32_psradi512(__gcc_v16si, int);
172 __gcc_v8di __builtin_ia32_psraq512(__gcc_v8di, __gcc_v2di);
173 __gcc_v8di __builtin_ia32_psraqi512(__gcc_v8di, int);
174 __gcc_v16si __builtin_ia32_psrav16si(__gcc_v16si, __gcc_v16si);
175 __gcc_v8di __builtin_ia32_psrav8di(__gcc_v8di, __gcc_v8di);
176 __gcc_v16si __builtin_ia32_psrld512(__gcc_v16si, __gcc_v4si);
177 __gcc_v16si __builtin_ia32_psrldi512(__gcc_v16si, int);
178 __gcc_v8di __builtin_ia32_psrlq512(__gcc_v8di, __gcc_v2di);
179 __gcc_v8di __builtin_ia32_psrlqi512(__gcc_v8di, int);
180 __gcc_v16si __builtin_ia32_psrlv16si(__gcc_v16si, __gcc_v16si);
181 __gcc_v8di __builtin_ia32_psrlv8di(__gcc_v8di, __gcc_v8di);
182 double __builtin_ia32_reduce_fadd_pd512(double, __gcc_v8df);
183 float __builtin_ia32_reduce_fadd_ps512(float, __gcc_v16sf);
184 double __builtin_ia32_reduce_fmax_pd512(__gcc_v8df); // fmax/fmin: vector operand only, same shape as the *_ph512 forms
185 float __builtin_ia32_reduce_fmax_ps512(__gcc_v16sf);
186 double __builtin_ia32_reduce_fmin_pd512(__gcc_v8df);
187 float __builtin_ia32_reduce_fmin_ps512(__gcc_v16sf);
188 double __builtin_ia32_reduce_fmul_pd512(double, __gcc_v8df);
189 float __builtin_ia32_reduce_fmul_ps512(float, __gcc_v16sf);
190 __gcc_v2df __builtin_ia32_rndscalesd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int, int);
191 __gcc_v4sf __builtin_ia32_rndscaless_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int, int);
192 __gcc_v2df __builtin_ia32_scalefsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
193 __gcc_v4sf __builtin_ia32_scalefss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
194 __gcc_v8di __builtin_ia32_selectq_512(unsigned char, __gcc_v8di, __gcc_v8di);
195 __gcc_v16sf __builtin_ia32_shuf_f32x4(__gcc_v16sf, __gcc_v16sf, int);
196 __gcc_v8df __builtin_ia32_shuf_f64x2(__gcc_v8df, __gcc_v8df, int);
197 __gcc_v16si __builtin_ia32_shuf_i32x4(__gcc_v16si, __gcc_v16si, int);
198 __gcc_v8di __builtin_ia32_shuf_i64x2(__gcc_v8di, __gcc_v8di, int);
199 __gcc_v8df __builtin_ia32_shufpd512(__gcc_v8df, __gcc_v8df, int);
200 __gcc_v16sf __builtin_ia32_shufps512(__gcc_v16sf, __gcc_v16sf, int);
201 __gcc_v2df __builtin_ia32_sqrtsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
202 __gcc_v4sf __builtin_ia32_sqrtss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
203 void __builtin_ia32_storesd128_mask(__gcc_v2df *, __gcc_v2df, unsigned char);
204 void __builtin_ia32_storess128_mask(__gcc_v4sf *, __gcc_v4sf, unsigned char);
205 __gcc_v8df __builtin_ia32_subpd512(__gcc_v8df, __gcc_v8df, int);
206 __gcc_v16sf __builtin_ia32_subps512(__gcc_v16sf, __gcc_v16sf, int);
207 __gcc_v2df __builtin_ia32_subsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int);
208 __gcc_v4sf __builtin_ia32_subss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
209 __gcc_v16si __builtin_ia32_vpermi2vard512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
210 __gcc_v8df __builtin_ia32_vpermi2varpd512(__gcc_v8df, __gcc_v8di, __gcc_v8df);
211 __gcc_v16sf __builtin_ia32_vpermi2varps512(__gcc_v16sf, __gcc_v16si, __gcc_v16sf);
212 __gcc_v8di __builtin_ia32_vpermi2varq512(__gcc_v8di, __gcc_v8di, __gcc_v8di);
213 __gcc_v8df __builtin_ia32_vpermilpd512(__gcc_v8df, int);
214 __gcc_v16sf __builtin_ia32_vpermilps512(__gcc_v16sf, int);
215 __gcc_v8df __builtin_ia32_vpermilvarpd512(__gcc_v8df, __gcc_v8di);
216 __gcc_v16sf __builtin_ia32_vpermilvarps512(__gcc_v16sf, __gcc_v16si);
217 // avx512f,vaes
218 __gcc_v8di __builtin_ia32_aesdec512(__gcc_v8di, __gcc_v8di);
219 __gcc_v8di __builtin_ia32_aesdeclast512(__gcc_v8di, __gcc_v8di);
220 __gcc_v8di __builtin_ia32_aesenc512(__gcc_v8di, __gcc_v8di);
221 __gcc_v8di __builtin_ia32_aesenclast512(__gcc_v8di, __gcc_v8di);
222 // avx512f,vpclmulqdq
223 __gcc_v8di __builtin_ia32_pclmulqdq512(__gcc_v8di, __gcc_v8di, char);
224 // avx512fp16
225 __gcc_v32hf __builtin_ia32_addph512(__gcc_v32hf, __gcc_v32hf, int);
226 __gcc_v8hf __builtin_ia32_addsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
227 unsigned int __builtin_ia32_cmpph512_mask(__gcc_v32hf, __gcc_v32hf, int, unsigned int, int);
228 unsigned char __builtin_ia32_cmpsh_mask(__gcc_v8hf, __gcc_v8hf, int, unsigned char, int);
229 __gcc_v32hf __builtin_ia32_divph512(__gcc_v32hf, __gcc_v32hf, int);
230 __gcc_v8hf __builtin_ia32_divsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
231 __gcc_v8hf __builtin_ia32_getexpsh128_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
232 __gcc_v8hf __builtin_ia32_getmantsh_round_mask(__gcc_v8hf, __gcc_v8hf, int, __gcc_v8hf, unsigned char, int);
233 __gcc_v8hf __builtin_ia32_loadsh128_mask(const __gcc_v8hf *, __gcc_v8hf, unsigned char);
234 __gcc_v32hf __builtin_ia32_maxph512(__gcc_v32hf, __gcc_v32hf, int);
235 __gcc_v8hf __builtin_ia32_maxsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
236 __gcc_v32hf __builtin_ia32_minph512(__gcc_v32hf, __gcc_v32hf, int);
237 __gcc_v8hf __builtin_ia32_minsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
238 __gcc_v32hf __builtin_ia32_mulph512(__gcc_v32hf, __gcc_v32hf, int);
239 __gcc_v8hf __builtin_ia32_mulsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
240 _Float16 __builtin_ia32_reduce_fadd_ph512(_Float16, __gcc_v32hf);
241 _Float16 __builtin_ia32_reduce_fmax_ph512(__gcc_v32hf);
242 _Float16 __builtin_ia32_reduce_fmin_ph512(__gcc_v32hf);
243 _Float16 __builtin_ia32_reduce_fmul_ph512(_Float16, __gcc_v32hf);
244 __gcc_v32hf __builtin_ia32_reduceph512_mask(__gcc_v32hf, int, __gcc_v32hf, unsigned int, int);
245 __gcc_v8hf __builtin_ia32_reducesh_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int, int);
246 __gcc_v32hf __builtin_ia32_rndscaleph_mask(__gcc_v32hf, int, __gcc_v32hf, unsigned int, int);
247 __gcc_v8hf __builtin_ia32_rndscalesh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int, int);
248 __gcc_v32hf __builtin_ia32_scalefph512_mask(__gcc_v32hf, __gcc_v32hf, __gcc_v32hf, unsigned int, int);
249 __gcc_v8hf __builtin_ia32_scalefsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
250 __gcc_v32hf __builtin_ia32_selectph_512(unsigned int, __gcc_v32hf, __gcc_v32hf);
251 __gcc_v8hf __builtin_ia32_selectsh_128(unsigned char, __gcc_v8hf, __gcc_v8hf);
252 __gcc_v32hf __builtin_ia32_sqrtph512(__gcc_v32hf, int);
253 __gcc_v8hf __builtin_ia32_sqrtsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
254 void __builtin_ia32_storesh128_mask(__gcc_v8hf *, __gcc_v8hf, unsigned char);
255 __gcc_v32hf __builtin_ia32_subph512(__gcc_v32hf, __gcc_v32hf, int);
256 __gcc_v8hf __builtin_ia32_subsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int);
257 int __builtin_ia32_vcomish(__gcc_v8hf, __gcc_v8hf, int, int);
258 __gcc_v16hf __builtin_ia32_vcvtdq2ph512_mask(__gcc_v16si, __gcc_v16hf, unsigned short, int);
259 __gcc_v8hf __builtin_ia32_vcvtpd2ph512_mask(__gcc_v8df, __gcc_v8hf, unsigned char, int);
260 __gcc_v16si __builtin_ia32_vcvtph2dq512_mask(__gcc_v16hf, __gcc_v16si, unsigned short, int);
261 __gcc_v8df __builtin_ia32_vcvtph2pd512_mask(__gcc_v8hf, __gcc_v8df, unsigned char, int);
262 __gcc_v16sf __builtin_ia32_vcvtph2psx512_mask(__gcc_v16hf, __gcc_v16sf, unsigned short, int);
263 __gcc_v8di __builtin_ia32_vcvtph2qq512_mask(__gcc_v8hf, __gcc_v8di, unsigned char, int);
264 __gcc_v16usi __builtin_ia32_vcvtph2udq512_mask(__gcc_v16hf, __gcc_v16usi, unsigned short, int);
265 __gcc_v8udi __builtin_ia32_vcvtph2uqq512_mask(__gcc_v8hf, __gcc_v8udi, unsigned char, int);
266 __gcc_v32uhi __builtin_ia32_vcvtph2uw512_mask(__gcc_v32hf, __gcc_v32uhi, unsigned int, int);
267 __gcc_v32hi __builtin_ia32_vcvtph2w512_mask(__gcc_v32hf, __gcc_v32hi, unsigned int, int);
268 __gcc_v16hf __builtin_ia32_vcvtps2phx512_mask(__gcc_v16sf, __gcc_v16hf, unsigned short, int);
269 __gcc_v8hf __builtin_ia32_vcvtqq2ph512_mask(__gcc_v8di, __gcc_v8hf, unsigned char, int);
270 __gcc_v8hf __builtin_ia32_vcvtsd2sh_round_mask(__gcc_v8hf, __gcc_v2df, __gcc_v8hf, unsigned char, int);
271 __gcc_v2df __builtin_ia32_vcvtsh2sd_round_mask(__gcc_v2df, __gcc_v8hf, __gcc_v2df, unsigned char, int);
272 int __builtin_ia32_vcvtsh2si32(__gcc_v8hf, int);
273 long long int __builtin_ia32_vcvtsh2si64(__gcc_v8hf, int);
274 __gcc_v4sf __builtin_ia32_vcvtsh2ss_round_mask(__gcc_v4sf, __gcc_v8hf, __gcc_v4sf, unsigned char, int);
275 unsigned int __builtin_ia32_vcvtsh2usi32(__gcc_v8hf, int);
276 unsigned long long int __builtin_ia32_vcvtsh2usi64(__gcc_v8hf, int);
277 __gcc_v8hf __builtin_ia32_vcvtsi2sh(__gcc_v8hf, int, int);
278 __gcc_v8hf __builtin_ia32_vcvtsi642sh(__gcc_v8hf, long long int, int);
279 __gcc_v8hf __builtin_ia32_vcvtss2sh_round_mask(__gcc_v8hf, __gcc_v4sf, __gcc_v8hf, unsigned char, int);
280 __gcc_v16si __builtin_ia32_vcvttph2dq512_mask(__gcc_v16hf, __gcc_v16si, unsigned short, int);
281 __gcc_v8di __builtin_ia32_vcvttph2qq512_mask(__gcc_v8hf, __gcc_v8di, unsigned char, int);
282 __gcc_v16usi __builtin_ia32_vcvttph2udq512_mask(__gcc_v16hf, __gcc_v16usi, unsigned short, int);
283 __gcc_v8udi __builtin_ia32_vcvttph2uqq512_mask(__gcc_v8hf, __gcc_v8udi, unsigned char, int);
284 __gcc_v32uhi __builtin_ia32_vcvttph2uw512_mask(__gcc_v32hf, __gcc_v32uhi, unsigned int, int);
285 __gcc_v32hi __builtin_ia32_vcvttph2w512_mask(__gcc_v32hf, __gcc_v32hi, unsigned int, int);
286 int __builtin_ia32_vcvttsh2si32(__gcc_v8hf, int);
287 long long int __builtin_ia32_vcvttsh2si64(__gcc_v8hf, int);
288 unsigned int __builtin_ia32_vcvttsh2usi32(__gcc_v8hf, int);
289 unsigned long long int __builtin_ia32_vcvttsh2usi64(__gcc_v8hf, int);
290 __gcc_v16hf __builtin_ia32_vcvtudq2ph512_mask(__gcc_v16usi, __gcc_v16hf, unsigned short, int);
291 __gcc_v8hf __builtin_ia32_vcvtuqq2ph512_mask(__gcc_v8udi, __gcc_v8hf, unsigned char, int);
292 __gcc_v8hf __builtin_ia32_vcvtusi2sh(__gcc_v8hf, unsigned int, int);
293 __gcc_v8hf __builtin_ia32_vcvtusi642sh(__gcc_v8hf, unsigned long long int, int);
294 __gcc_v32hf __builtin_ia32_vcvtuw2ph512_mask(__gcc_v32uhi, __gcc_v32hf, unsigned int, int);
295 __gcc_v32hf __builtin_ia32_vcvtw2ph512_mask(__gcc_v32hi, __gcc_v32hf, unsigned int, int);
296 __gcc_v16sf __builtin_ia32_vfcmaddcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
297 __gcc_v16sf __builtin_ia32_vfcmaddcph512_mask3(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
298 __gcc_v16sf __builtin_ia32_vfcmaddcph512_maskz(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
299 __gcc_v4sf __builtin_ia32_vfcmaddcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
300 __gcc_v4sf __builtin_ia32_vfcmaddcsh_maskz(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
301 __gcc_v4sf __builtin_ia32_vfcmaddcsh_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
302 __gcc_v4sf __builtin_ia32_vfcmaddcsh_round_mask3(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
303 __gcc_v16sf __builtin_ia32_vfcmulcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
304 __gcc_v4sf __builtin_ia32_vfcmulcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
305 __gcc_v16sf __builtin_ia32_vfmaddcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
306 __gcc_v16sf __builtin_ia32_vfmaddcph512_mask3(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
307 __gcc_v16sf __builtin_ia32_vfmaddcph512_maskz(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
308 __gcc_v4sf __builtin_ia32_vfmaddcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
309 __gcc_v4sf __builtin_ia32_vfmaddcsh_maskz(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
310 __gcc_v4sf __builtin_ia32_vfmaddcsh_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
311 __gcc_v4sf __builtin_ia32_vfmaddcsh_round_mask3(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
312 __gcc_v16sf __builtin_ia32_vfmulcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int);
313 __gcc_v4sf __builtin_ia32_vfmulcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int);
314 // avx512fp16,avx512vl
315 unsigned char __builtin_ia32_cmpph128_mask(__gcc_v8hf, __gcc_v8hf, int, unsigned char);
316 unsigned short __builtin_ia32_cmpph256_mask(__gcc_v16hf, __gcc_v16hf, int, unsigned short);
317 __gcc_v8hf __builtin_ia32_maxph128(__gcc_v8hf, __gcc_v8hf);
318 __gcc_v16hf __builtin_ia32_maxph256(__gcc_v16hf, __gcc_v16hf);
319 __gcc_v8hf __builtin_ia32_minph128(__gcc_v8hf, __gcc_v8hf);
320 __gcc_v16hf __builtin_ia32_minph256(__gcc_v16hf, __gcc_v16hf);
321 _Float16 __builtin_ia32_reduce_fadd_ph128(_Float16, __gcc_v8hf);
322 _Float16 __builtin_ia32_reduce_fadd_ph256(_Float16, __gcc_v16hf);
323 _Float16 __builtin_ia32_reduce_fmax_ph128(__gcc_v8hf);
324 _Float16 __builtin_ia32_reduce_fmax_ph256(__gcc_v16hf);
325 _Float16 __builtin_ia32_reduce_fmin_ph128(__gcc_v8hf);
326 _Float16 __builtin_ia32_reduce_fmin_ph256(__gcc_v16hf);
327 _Float16 __builtin_ia32_reduce_fmul_ph128(_Float16, __gcc_v8hf);
328 _Float16 __builtin_ia32_reduce_fmul_ph256(_Float16, __gcc_v16hf);
329 __gcc_v8hf __builtin_ia32_rndscaleph_128_mask(__gcc_v8hf, int, __gcc_v8hf, unsigned char);
330 __gcc_v16hf __builtin_ia32_rndscaleph_256_mask(__gcc_v16hf, int, __gcc_v16hf, unsigned short);
331 __gcc_v8hf __builtin_ia32_selectph_128(unsigned char, __gcc_v8hf, __gcc_v8hf);
332 __gcc_v16hf __builtin_ia32_selectph_256(unsigned short, __gcc_v16hf, __gcc_v16hf);
333 __gcc_v8hf __builtin_ia32_sqrtph(__gcc_v8hf);
334 __gcc_v16hf __builtin_ia32_sqrtph256(__gcc_v16hf);
335 __gcc_v8hf __builtin_ia32_vfmaddph(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf);
336 __gcc_v16hf __builtin_ia32_vfmaddph256(__gcc_v16hf, __gcc_v16hf, __gcc_v16hf);
337 __gcc_v8hf __builtin_ia32_vfmaddsubph(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf);
338 __gcc_v16hf __builtin_ia32_vfmaddsubph256(__gcc_v16hf, __gcc_v16hf, __gcc_v16hf);
339 // avx512ifma
340 __gcc_v8di __builtin_ia32_vpmadd52huq512(__gcc_v8di, __gcc_v8di, __gcc_v8di);
341 __gcc_v8di __builtin_ia32_vpmadd52luq512(__gcc_v8di, __gcc_v8di, __gcc_v8di);
342 // avx512ifma,avx512vl|avxifma
343 __gcc_v2di __builtin_ia32_vpmadd52huq128(__gcc_v2di, __gcc_v2di, __gcc_v2di);
344 __gcc_v4di __builtin_ia32_vpmadd52huq256(__gcc_v4di, __gcc_v4di, __gcc_v4di);
345 __gcc_v2di __builtin_ia32_vpmadd52luq128(__gcc_v2di, __gcc_v2di, __gcc_v2di);
346 __gcc_v4di __builtin_ia32_vpmadd52luq256(__gcc_v4di, __gcc_v4di, __gcc_v4di);
347 // avx512vbmi
348 __gcc_v64qi __builtin_ia32_permvarqi512(__gcc_v64qi, __gcc_v64qi);
349 __gcc_v64qi __builtin_ia32_vpermi2varqi512(__gcc_v64qi, __gcc_v64qi, __gcc_v64qi);
350 __gcc_v64qi __builtin_ia32_vpmultishiftqb512(__gcc_v64qi, __gcc_v64qi);
351 // avx512vbmi,avx512vl
352 __gcc_v16qi __builtin_ia32_permvarqi128(__gcc_v16qi, __gcc_v16qi);
353 __gcc_v32qi __builtin_ia32_permvarqi256(__gcc_v32qi, __gcc_v32qi);
354 __gcc_v16qi __builtin_ia32_vpermi2varqi128(__gcc_v16qi, __gcc_v16qi, __gcc_v16qi);
355 __gcc_v32qi __builtin_ia32_vpermi2varqi256(__gcc_v32qi, __gcc_v32qi, __gcc_v32qi);
356 __gcc_v16qi __builtin_ia32_vpmultishiftqb128(__gcc_v16qi, __gcc_v16qi);
357 __gcc_v32qi __builtin_ia32_vpmultishiftqb256(__gcc_v32qi, __gcc_v32qi);
358 // avx512vbmi2
359 void __builtin_ia32_compressstorehi512_mask(__gcc_v32hi *, __gcc_v32hi, unsigned int);
360 void __builtin_ia32_compressstoreqi512_mask(__gcc_v64qi *, __gcc_v64qi, unsigned long long int);
361 __gcc_v16si __builtin_ia32_vpshldd512(__gcc_v16si, __gcc_v16si, int);
362 __gcc_v8di __builtin_ia32_vpshldq512(__gcc_v8di, __gcc_v8di, int);
363 __gcc_v16si __builtin_ia32_vpshldvd512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
364 __gcc_v8di __builtin_ia32_vpshldvq512(__gcc_v8di, __gcc_v8di, __gcc_v8di);
365 __gcc_v32hi __builtin_ia32_vpshldvw512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi);
366 __gcc_v32hi __builtin_ia32_vpshldw512(__gcc_v32hi, __gcc_v32hi, int);
367 __gcc_v16si __builtin_ia32_vpshrdd512(__gcc_v16si, __gcc_v16si, int);
368 __gcc_v8di __builtin_ia32_vpshrdq512(__gcc_v8di, __gcc_v8di, int);
369 __gcc_v16si __builtin_ia32_vpshrdvd512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
370 __gcc_v8di __builtin_ia32_vpshrdvq512(__gcc_v8di, __gcc_v8di, __gcc_v8di);
371 __gcc_v32hi __builtin_ia32_vpshrdvw512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi);
372 __gcc_v32hi __builtin_ia32_vpshrdw512(__gcc_v32hi, __gcc_v32hi, int);
373 // avx512vl
374 __gcc_v4si __builtin_ia32_alignd128(__gcc_v4si, __gcc_v4si, int);
375 __gcc_v8si __builtin_ia32_alignd256(__gcc_v8si, __gcc_v8si, int);
376 __gcc_v2di __builtin_ia32_alignq128(__gcc_v2di, __gcc_v2di, int);
377 __gcc_v4di __builtin_ia32_alignq256(__gcc_v4di, __gcc_v4di, int);
378 __gcc_v8sf __builtin_ia32_insertf32x4_256(__gcc_v8sf, __gcc_v4sf, int);
379 __gcc_v8si __builtin_ia32_inserti32x4_256(__gcc_v8si, __gcc_v4si, int);
380 __gcc_v4df __builtin_ia32_permvardf256(__gcc_v4df, __gcc_v4di);
381 __gcc_v4di __builtin_ia32_permvardi256(__gcc_v4di, __gcc_v4di);
382 __gcc_v4si __builtin_ia32_prold128(__gcc_v4si, int);
383 __gcc_v8si __builtin_ia32_prold256(__gcc_v8si, int);
384 __gcc_v2di __builtin_ia32_prolq128(__gcc_v2di, int);
385 __gcc_v4di __builtin_ia32_prolq256(__gcc_v4di, int);
386 __gcc_v4si __builtin_ia32_prolvd128(__gcc_v4si, __gcc_v4si);
387 __gcc_v8si __builtin_ia32_prolvd256(__gcc_v8si, __gcc_v8si);
388 __gcc_v2di __builtin_ia32_prolvq128(__gcc_v2di, __gcc_v2di);
389 __gcc_v4di __builtin_ia32_prolvq256(__gcc_v4di, __gcc_v4di);
390 __gcc_v4si __builtin_ia32_prord128(__gcc_v4si, int);
391 __gcc_v8si __builtin_ia32_prord256(__gcc_v8si, int);
392 __gcc_v2di __builtin_ia32_prorq128(__gcc_v2di, int);
393 __gcc_v4di __builtin_ia32_prorq256(__gcc_v4di, int);
394 __gcc_v4si __builtin_ia32_prorvd128(__gcc_v4si, __gcc_v4si);
395 __gcc_v8si __builtin_ia32_prorvd256(__gcc_v8si, __gcc_v8si);
396 __gcc_v2di __builtin_ia32_prorvq128(__gcc_v2di, __gcc_v2di);
397 __gcc_v4di __builtin_ia32_prorvq256(__gcc_v4di, __gcc_v4di);
398 __gcc_v2di __builtin_ia32_psraq128(__gcc_v2di, __gcc_v2di);
399 __gcc_v4di __builtin_ia32_psraq256(__gcc_v4di, __gcc_v2di);
400 __gcc_v2di __builtin_ia32_psraqi128(__gcc_v2di, int);
401 __gcc_v4di __builtin_ia32_psraqi256(__gcc_v4di, int);
402 __gcc_v2di __builtin_ia32_psravq128(__gcc_v2di, __gcc_v2di);
403 __gcc_v4di __builtin_ia32_psravq256(__gcc_v4di, __gcc_v4di);
404 __gcc_v2di __builtin_ia32_selectq_128(unsigned char, __gcc_v2di, __gcc_v2di);
405 __gcc_v4di __builtin_ia32_selectq_256(unsigned char, __gcc_v4di, __gcc_v4di);
406 __gcc_v8sf __builtin_ia32_shuf_f32x4_256(__gcc_v8sf, __gcc_v8sf, int);
407 __gcc_v4df __builtin_ia32_shuf_f64x2_256(__gcc_v4df, __gcc_v4df, int);
408 __gcc_v8si __builtin_ia32_shuf_i32x4_256(__gcc_v8si, __gcc_v8si, int);
409 __gcc_v4di __builtin_ia32_shuf_i64x2_256(__gcc_v4di, __gcc_v4di, int);
410 __gcc_v4si __builtin_ia32_vpermi2vard128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
411 __gcc_v8si __builtin_ia32_vpermi2vard256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
412 __gcc_v2df __builtin_ia32_vpermi2varpd128(__gcc_v2df, __gcc_v2di, __gcc_v2df);
413 __gcc_v4df __builtin_ia32_vpermi2varpd256(__gcc_v4df, __gcc_v4di, __gcc_v4df);
414 __gcc_v4sf __builtin_ia32_vpermi2varps128(__gcc_v4sf, __gcc_v4si, __gcc_v4sf);
415 __gcc_v8sf __builtin_ia32_vpermi2varps256(__gcc_v8sf, __gcc_v8si, __gcc_v8sf);
416 __gcc_v2di __builtin_ia32_vpermi2varq128(__gcc_v2di, __gcc_v2di, __gcc_v2di);
417 __gcc_v4di __builtin_ia32_vpermi2varq256(__gcc_v4di, __gcc_v4di, __gcc_v4di);
418 // avx512vl,avx512bitalg
419 __gcc_v16qi __builtin_ia32_vpopcntb_128(__gcc_v16qi);
420 __gcc_v32qi __builtin_ia32_vpopcntb_256(__gcc_v32qi);
421 __gcc_v8hi __builtin_ia32_vpopcntw_128(__gcc_v8hi);
422 __gcc_v16hi __builtin_ia32_vpopcntw_256(__gcc_v16hi);
423 // avx512vl,avx512bw
424 __gcc_v8hi __builtin_ia32_vpermi2varhi128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi);
425 __gcc_v16hi __builtin_ia32_vpermi2varhi256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi);
426 // avx512vl,avx512vbmi2
427 void __builtin_ia32_compressstorehi128_mask(__gcc_v8hi *, __gcc_v8hi, unsigned char);
428 void __builtin_ia32_compressstorehi256_mask(__gcc_v16hi *, __gcc_v16hi, unsigned short);
429 void __builtin_ia32_compressstoreqi128_mask(__gcc_v16qi *, __gcc_v16qi, unsigned short);
430 void __builtin_ia32_compressstoreqi256_mask(__gcc_v32qi *, __gcc_v32qi, unsigned int);
431 __gcc_v4si __builtin_ia32_vpshldd128(__gcc_v4si, __gcc_v4si, int);
432 __gcc_v8si __builtin_ia32_vpshldd256(__gcc_v8si, __gcc_v8si, int);
433 __gcc_v2di __builtin_ia32_vpshldq128(__gcc_v2di, __gcc_v2di, int);
434 __gcc_v4di __builtin_ia32_vpshldq256(__gcc_v4di, __gcc_v4di, int);
435 __gcc_v4si __builtin_ia32_vpshldvd128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
436 __gcc_v8si __builtin_ia32_vpshldvd256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
437 __gcc_v2di __builtin_ia32_vpshldvq128(__gcc_v2di, __gcc_v2di, __gcc_v2di);
438 __gcc_v4di __builtin_ia32_vpshldvq256(__gcc_v4di, __gcc_v4di, __gcc_v4di);
439 __gcc_v8hi __builtin_ia32_vpshldvw128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi);
440 __gcc_v16hi __builtin_ia32_vpshldvw256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi);
441 __gcc_v8hi __builtin_ia32_vpshldw128(__gcc_v8hi, __gcc_v8hi, int);
442 __gcc_v16hi __builtin_ia32_vpshldw256(__gcc_v16hi, __gcc_v16hi, int);
443 __gcc_v4si __builtin_ia32_vpshrdd128(__gcc_v4si, __gcc_v4si, int);
444 __gcc_v8si __builtin_ia32_vpshrdd256(__gcc_v8si, __gcc_v8si, int);
445 __gcc_v2di __builtin_ia32_vpshrdq128(__gcc_v2di, __gcc_v2di, int);
446 __gcc_v4di __builtin_ia32_vpshrdq256(__gcc_v4di, __gcc_v4di, int);
447 __gcc_v4si __builtin_ia32_vpshrdvd128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
448 __gcc_v8si __builtin_ia32_vpshrdvd256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
449 __gcc_v2di __builtin_ia32_vpshrdvq128(__gcc_v2di, __gcc_v2di, __gcc_v2di);
450 __gcc_v4di __builtin_ia32_vpshrdvq256(__gcc_v4di, __gcc_v4di, __gcc_v4di);
451 __gcc_v8hi __builtin_ia32_vpshrdvw128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi);
452 __gcc_v16hi __builtin_ia32_vpshrdvw256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi);
453 __gcc_v8hi __builtin_ia32_vpshrdw128(__gcc_v8hi, __gcc_v8hi, int);
454 __gcc_v16hi __builtin_ia32_vpshrdw256(__gcc_v16hi, __gcc_v16hi, int);
455 // avx512vl,avx512vnni|avxvnni
456 __gcc_v4si __builtin_ia32_vpdpbusd128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
457 __gcc_v8si __builtin_ia32_vpdpbusd256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
458 __gcc_v4si __builtin_ia32_vpdpbusds128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
459 __gcc_v8si __builtin_ia32_vpdpbusds256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
460 __gcc_v4si __builtin_ia32_vpdpwssd128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
461 __gcc_v8si __builtin_ia32_vpdpwssd256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
462 __gcc_v4si __builtin_ia32_vpdpwssds128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
463 __gcc_v8si __builtin_ia32_vpdpwssds256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
464 // avx512vnni
465 __gcc_v16si __builtin_ia32_vpdpbusd512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
466 __gcc_v16si __builtin_ia32_vpdpbusds512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
467 __gcc_v16si __builtin_ia32_vpdpwssd512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
468 __gcc_v16si __builtin_ia32_vpdpwssds512(__gcc_v16si, __gcc_v16si, __gcc_v16si);
469 // avx512vp2intersect
470 void __builtin_ia32_vp2intersect_q_512(__gcc_v8di, __gcc_v8di, unsigned char *, unsigned char *);
471 // avx512vp2intersect,avx512vl
472 void __builtin_ia32_vp2intersect_q_128(__gcc_v2di, __gcc_v2di, unsigned char *, unsigned char *);
473 void __builtin_ia32_vp2intersect_q_256(__gcc_v4di, __gcc_v4di, unsigned char *, unsigned char *);
474 // avx512vpopcntdq
475 __gcc_v16si __builtin_ia32_vpopcntd_512(__gcc_v16si);
476 __gcc_v8di __builtin_ia32_vpopcntq_512(__gcc_v8di);
477 // avx512vpopcntdq,avx512vl
478 __gcc_v4si __builtin_ia32_vpopcntd_128(__gcc_v4si);
479 __gcc_v8si __builtin_ia32_vpopcntd_256(__gcc_v8si);
480 __gcc_v2di __builtin_ia32_vpopcntq_128(__gcc_v2di);
481 __gcc_v4di __builtin_ia32_vpopcntq_256(__gcc_v4di);
482 // avxneconvert
483 __gcc_v4sf __builtin_ia32_vbcstnebf162ps128(const _Float16 *);
484 __gcc_v8sf __builtin_ia32_vbcstnebf162ps256(const _Float16 *);
485 __gcc_v4sf __builtin_ia32_vbcstnesh2ps128(const _Float16 *);
486 __gcc_v8sf __builtin_ia32_vbcstnesh2ps256(const _Float16 *);
487 __gcc_v4sf __builtin_ia32_vcvtneebf162ps128(const __gcc_v8hf *);
488 __gcc_v8sf __builtin_ia32_vcvtneebf162ps256(const __gcc_v16hf *);
489 __gcc_v4sf __builtin_ia32_vcvtneeph2ps128(const __gcc_v8hf *);
490 __gcc_v8sf __builtin_ia32_vcvtneeph2ps256(const __gcc_v16hf *);
491 __gcc_v4sf __builtin_ia32_vcvtneobf162ps128(const __gcc_v8hf *);
492 __gcc_v8sf __builtin_ia32_vcvtneobf162ps256(const __gcc_v16hf *);
493 __gcc_v4sf __builtin_ia32_vcvtneoph2ps128(const __gcc_v8hf *);
494 __gcc_v8sf __builtin_ia32_vcvtneoph2ps256(const __gcc_v16hf *);
495 // avxvnniint8
496 __gcc_v4si __builtin_ia32_vpdpbssd128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
497 __gcc_v8si __builtin_ia32_vpdpbssd256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
498 __gcc_v4si __builtin_ia32_vpdpbssds128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
499 __gcc_v8si __builtin_ia32_vpdpbssds256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
500 __gcc_v4si __builtin_ia32_vpdpbsud128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
501 __gcc_v8si __builtin_ia32_vpdpbsud256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
502 __gcc_v4si __builtin_ia32_vpdpbsuds128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
503 __gcc_v8si __builtin_ia32_vpdpbsuds256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
504 __gcc_v4si __builtin_ia32_vpdpbuud128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
505 __gcc_v8si __builtin_ia32_vpdpbuud256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
506 __gcc_v4si __builtin_ia32_vpdpbuuds128(__gcc_v4si, __gcc_v4si, __gcc_v4si);
507 __gcc_v8si __builtin_ia32_vpdpbuuds256(__gcc_v8si, __gcc_v8si, __gcc_v8si);
508 // clang
509 unsigned int __builtin_ia32_readeflags_u32(void);
510 unsigned char __builtin_ia32_subborrow_u32(unsigned char, unsigned int, unsigned int, unsigned int *);
511 unsigned char __builtin_ia32_subborrow_u64(unsigned char, unsigned long long int, unsigned long long int, unsigned long long int *);
513 // cmpccxadd
514 signed int __builtin_ia32_cmpccxadd32(void *, signed int, signed int, int);
515 signed long long int __builtin_ia32_cmpccxadd64(void *, signed long long int, signed long long int, int);
516 // fma4
517 __gcc_v2df __builtin_ia32_vfmaddsd(__gcc_v2df, __gcc_v2df, __gcc_v2df);
518 __gcc_v4sf __builtin_ia32_vfmaddss(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf);
519 // invpcid
520 void __builtin_ia32_invpcid(unsigned int, void *);
521 void __builtin_ia32_directstore_u32(unsigned int *, unsigned int);
522 void __builtin_ia32_directstore_u64(unsigned long int *, unsigned long int);
523 void __builtin_ia32_prefetchi(const void *, unsigned int);
524 void __builtin_ia32_aadd32(void *, signed int);
525 void __builtin_ia32_aadd64(void *, signed long long int);
526 void __builtin_ia32_aand32(void *, signed int);
527 void __builtin_ia32_aand64(void *, signed long long int);
528 void __builtin_ia32_aor32(void *, signed int);
529 void __builtin_ia32_aor64(void *, signed long long int);
530 void __builtin_ia32_axor32(void *, signed int);
531 void __builtin_ia32_axor64(void *, signed long long int);
532 unsigned long long int __builtin_ia32_rdpru(int);
533 // rdseed
534 unsigned int __builtin_ia32_rdseed16_step(unsigned short *);
535 unsigned int __builtin_ia32_rdseed32_step(unsigned int *);
536 unsigned int __builtin_ia32_rdseed64_step(unsigned long long int *);
537 // sse2
538 __gcc_v2di __builtin_ia32_pslldqi128_byteshift(__gcc_v2di, int);
539 __gcc_v2di __builtin_ia32_psrldqi128_byteshift(__gcc_v2di, int);
540 __gcc_v4di __builtin_ia32_aesdec256(__gcc_v4di, __gcc_v4di);
541 __gcc_v4di __builtin_ia32_aesdeclast256(__gcc_v4di, __gcc_v4di);
542 __gcc_v4di __builtin_ia32_aesenc256(__gcc_v4di, __gcc_v4di);
543 __gcc_v4di __builtin_ia32_aesenclast256(__gcc_v4di, __gcc_v4di);
544 // vpclmulqdq
545 __gcc_v4di __builtin_ia32_pclmulqdq256(__gcc_v4di, __gcc_v4di, char);
546 // xop
547 __gcc_v16qi __builtin_ia32_vpcomb(__gcc_v16qi, __gcc_v16qi, char);
548 __gcc_v4si __builtin_ia32_vpcomd(__gcc_v4si, __gcc_v4si, char);
549 __gcc_v2di __builtin_ia32_vpcomq(__gcc_v2di, __gcc_v2di, char);
550 __gcc_v16qi __builtin_ia32_vpcomub(__gcc_v16qi, __gcc_v16qi, char);
551 __gcc_v4si __builtin_ia32_vpcomud(__gcc_v4si, __gcc_v4si, char);
552 __gcc_v2di __builtin_ia32_vpcomuq(__gcc_v2di, __gcc_v2di, char);
553 __gcc_v8hi __builtin_ia32_vpcomuw(__gcc_v8hi, __gcc_v8hi, char);
554 __gcc_v8hi __builtin_ia32_vpcomw(__gcc_v8hi, __gcc_v8hi, char);
555 __gcc_v16qi __builtin_ia32_vprotbi(__gcc_v16qi, char);
556 __gcc_v4si __builtin_ia32_vprotdi(__gcc_v4si, char);
557 __gcc_v2di __builtin_ia32_vprotqi(__gcc_v2di, char);
558 __gcc_v8hi __builtin_ia32_vprotwi(__gcc_v8hi, char);
559 // clang-format on
__gcc_v8df __builtin_ia32_insertf64x4(__gcc_v8df, __gcc_v4df, int)
__gcc_v4sf __builtin_ia32_sqrtss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v8di __builtin_ia32_aesdec512(__gcc_v8di, __gcc_v8di)
__gcc_v32hf __builtin_ia32_maxph512(__gcc_v32hf, __gcc_v32hf, int)
__gcc_v4di __builtin_ia32_inserti64x2_256(__gcc_v4di, __gcc_v2di, int)
float __builtin_ia32_reduce_fadd_ps512(float, __gcc_v16sf)
__gcc_v8sf __builtin_ia32_vpermi2varps256(__gcc_v8sf, __gcc_v8si, __gcc_v8sf)
_Float16 __builtin_ia32_reduce_fadd_ph256(_Float16, __gcc_v16hf)
__gcc_v4sf __builtin_ia32_gatherq_ps(__gcc_v4sf, const float *, __gcc_v2di, __gcc_v4sf, char)
__gcc_v8hf __builtin_ia32_vcvtusi2sh(__gcc_v8hf, unsigned int, int)
__gcc_v4di __builtin_ia32_psravq256(__gcc_v4di, __gcc_v4di)
__gcc_v2di __builtin_ia32_vprotqi(__gcc_v2di, char)
void __builtin_ia32_storess128_mask(__gcc_v4sf *, __gcc_v4sf, unsigned char)
__gcc_v2di __builtin_ia32_selectq_128(unsigned char, __gcc_v2di, __gcc_v2di)
__gcc_v4di __builtin_ia32_vpmadd52luq256(__gcc_v4di, __gcc_v4di, __gcc_v4di)
void __builtin_ia32_vp2intersect_q_128(__gcc_v2di, __gcc_v2di, unsigned char *, unsigned char *)
__gcc_v8di __builtin_ia32_vcvttph2qq512_mask(__gcc_v8hf, __gcc_v8di, unsigned char, int)
__gcc_v8hf __builtin_ia32_getmantsh_round_mask(__gcc_v8hf, __gcc_v8hf, int, __gcc_v8hf, unsigned char, int)
unsigned int __builtin_ia32_readeflags_u32(void)
int __builtin_ia32_vec_ext_v8si(__gcc_v8si, int)
__gcc_v4di __builtin_ia32_psrldqi256_byteshift(__gcc_v4di, int)
__gcc_v4sf __builtin_ia32_vpermi2varps128(__gcc_v4sf, __gcc_v4si, __gcc_v4sf)
_Float16 __builtin_ia32_reduce_fmul_ph256(_Float16, __gcc_v16hf)
__gcc_v4di __builtin_ia32_prolq256(__gcc_v4di, int)
__gcc_v4sf __builtin_ia32_mulss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v2di __builtin_ia32_psrldqi128_byteshift(__gcc_v2di, int)
__gcc_v8si __builtin_ia32_vpdpbusd256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v2df __builtin_ia32_addsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v4si __builtin_ia32_prord128(__gcc_v4si, int)
__gcc_v8si __builtin_ia32_prorvd256(__gcc_v8si, __gcc_v8si)
__gcc_v8hf __builtin_ia32_vcvtneps2bf16256(__gcc_v8sf)
__gcc_v8hf __builtin_ia32_selectph_128(unsigned char, __gcc_v8hf, __gcc_v8hf)
__gcc_v16hi __builtin_ia32_vpshrdw256(__gcc_v16hi, __gcc_v16hi, int)
__gcc_v4df __builtin_ia32_insertf64x2_256(__gcc_v4df, __gcc_v2df, int)
__gcc_v16qi __builtin_ia32_vpopcntb_128(__gcc_v16qi)
__gcc_v8sf __builtin_ia32_insertf32x4_256(__gcc_v8sf, __gcc_v4sf, int)
__gcc_v4sf __builtin_ia32_vfmaddss(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf)
__gcc_v8hi __builtin_ia32_psrav8hi(__gcc_v8hi, __gcc_v8hi)
__gcc_v32hi __builtin_ia32_psllv32hi(__gcc_v32hi, __gcc_v32hi)
__gcc_v4di __builtin_ia32_permvardi256(__gcc_v4di, __gcc_v4di)
__gcc_v4sf __builtin_ia32_getexpss128_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
double __builtin_ia32_reduce_fmax_pd512(__gcc_v8df)
__gcc_v16sf __builtin_ia32_vfmaddcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v16si __builtin_ia32_pmaddwd512(__gcc_v32hi, __gcc_v32hi)
__gcc_v8di __builtin_ia32_inserti64x4(__gcc_v8di, __gcc_v4di, int)
__gcc_v8hf __builtin_ia32_vcvtsi2sh(__gcc_v8hf, int, int)
unsigned long long int __builtin_ia32_vcvtsh2usi64(__gcc_v8hf, int)
__gcc_v4si __builtin_ia32_vprotdi(__gcc_v4si, char)
__gcc_v32uhi __builtin_ia32_vcvtph2uw512_mask(__gcc_v32hf, __gcc_v32uhi, unsigned int, int)
unsigned int __builtin_ia32_vcvttsh2usi32(__gcc_v8hf, int)
__gcc_v32hi __builtin_ia32_vpshldvw512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi)
__gcc_v4sf __builtin_ia32_vcvtsh2ss_round_mask(__gcc_v4sf, __gcc_v8hf, __gcc_v4sf, unsigned char, int)
__gcc_v16hf __builtin_ia32_selectph_256(unsigned short, __gcc_v16hf, __gcc_v16hf)
__gcc_v16si __builtin_ia32_psllv16si(__gcc_v16si, __gcc_v16si)
__gcc_v4si __builtin_ia32_vpshrdvd128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v2df __builtin_ia32_vcvtsh2sd_round_mask(__gcc_v2df, __gcc_v8hf, __gcc_v2df, unsigned char, int)
_Float16 __builtin_ia32_reduce_fadd_ph128(_Float16, __gcc_v8hf)
__gcc_v8hf __builtin_ia32_vcvtsd2sh_round_mask(__gcc_v8hf, __gcc_v2df, __gcc_v8hf, unsigned char, int)
__gcc_v4si __builtin_ia32_prorvd128(__gcc_v4si, __gcc_v4si)
__gcc_v8udi __builtin_ia32_vcvttph2uqq512_mask(__gcc_v8hf, __gcc_v8udi, unsigned char, int)
double __builtin_ia32_reduce_fadd_pd512(double, __gcc_v8df)
__gcc_v2di __builtin_ia32_alignq128(__gcc_v2di, __gcc_v2di, int)
__gcc_v4si __builtin_ia32_vpshrdd128(__gcc_v4si, __gcc_v4si, int)
__gcc_v4sf __builtin_ia32_vfcmulcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
_Float16 __builtin_ia32_reduce_fmax_ph128(__gcc_v8hf)
__gcc_v32hf __builtin_ia32_reduceph512_mask(__gcc_v32hf, int, __gcc_v32hf, unsigned int, int)
__gcc_v4si __builtin_ia32_gatherd_d(__gcc_v4si, const int *, __gcc_v4si, __gcc_v4si, char)
void __builtin_ia32_compressstorehi128_mask(__gcc_v8hi *, __gcc_v8hi, unsigned char)
__gcc_v4sf __builtin_ia32_maxss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
unsigned int __builtin_ia32_cmpph512_mask(__gcc_v32hf, __gcc_v32hf, int, unsigned int, int)
__gcc_v8di __builtin_ia32_alignq512(__gcc_v8di, __gcc_v8di, int)
__gcc_v8hf __builtin_ia32_minsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v8di __builtin_ia32_psrldqi512_byteshift(__gcc_v8di, int)
__gcc_v4sf __builtin_ia32_vfcmaddcsh_round_mask3(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
unsigned char __builtin_ia32_subborrow_u32(unsigned char, unsigned int, unsigned int, unsigned int *)
__gcc_v32hf __builtin_ia32_vcvtw2ph512_mask(__gcc_v32hi, __gcc_v32hf, unsigned int, int)
__gcc_v8si __builtin_ia32_vpopcntd_256(__gcc_v8si)
__gcc_v8di __builtin_ia32_psllq512(__gcc_v8di, __gcc_v2di)
__gcc_v16sf __builtin_ia32_insertf32x4(__gcc_v16sf, __gcc_v4sf, int)
__gcc_v8hi __builtin_ia32_psllv8hi(__gcc_v8hi, __gcc_v8hi)
__gcc_v2df __builtin_ia32_mulsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v2di __builtin_ia32_vplzcntq_128(__gcc_v2di)
__gcc_v2df __builtin_ia32_vfmaddsd(__gcc_v2df, __gcc_v2df, __gcc_v2df)
__gcc_v4df __builtin_ia32_gatherq_pd256(__gcc_v4df, const double *, __gcc_v4di, __gcc_v4df, char)
__gcc_v16sf __builtin_ia32_shufps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v16sf __builtin_ia32_vpermi2varps512(__gcc_v16sf, __gcc_v16si, __gcc_v16sf)
__gcc_v4di __builtin_ia32_vpermi2varq256(__gcc_v4di, __gcc_v4di, __gcc_v4di)
__gcc_v8di __builtin_ia32_aesenclast512(__gcc_v8di, __gcc_v8di)
__gcc_v16si __builtin_ia32_vpconflictsi_512(__gcc_v16si)
__gcc_v8hf __builtin_ia32_vcvtsi642sh(__gcc_v8hf, long long int, int)
__gcc_v8si __builtin_ia32_vpdpbuud256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v32hi __builtin_ia32_psllw512(__gcc_v32hi, __gcc_v8hi)
__gcc_v8hf __builtin_ia32_vfmaddph(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf)
double __builtin_ia32_reduce_fmin_pd512(__gcc_v8df)
__gcc_v4sf __builtin_ia32_vfmaddcsh_round_mask3(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v8hf __builtin_ia32_maxph128(__gcc_v8hf, __gcc_v8hf)
__gcc_v4di __builtin_ia32_vplzcntq_256(__gcc_v4di)
long long int __builtin_ia32_vec_ext_v4di(__gcc_v4di, int)
__gcc_v2di __builtin_ia32_psraq128(__gcc_v2di, __gcc_v2di)
__gcc_v32hi __builtin_ia32_psrlwi512(__gcc_v32hi, int)
__gcc_v4di __builtin_ia32_vpshrdvq256(__gcc_v4di, __gcc_v4di, __gcc_v4di)
__gcc_v8sf __builtin_ia32_vbcstnesh2ps256(const _Float16 *)
__gcc_v4di __builtin_ia32_aesdec256(__gcc_v4di, __gcc_v4di)
__gcc_v64qi __builtin_ia32_packsswb512(__gcc_v32hi, __gcc_v32hi)
__gcc_v8di __builtin_ia32_selectq_512(unsigned char, __gcc_v8di, __gcc_v8di)
void __builtin_ia32_compressstoreqi128_mask(__gcc_v16qi *, __gcc_v16qi, unsigned short)
unsigned char __builtin_ia32_subborrow_u64(unsigned char, unsigned long long int, unsigned long long int, unsigned long long int *)
__gcc_v2di __builtin_ia32_vpopcntq_128(__gcc_v2di)
__gcc_v8si __builtin_ia32_alignd256(__gcc_v8si, __gcc_v8si, int)
__gcc_v32hi __builtin_ia32_pmaddubsw512(__gcc_v64qi, __gcc_v64qi)
__gcc_v4si __builtin_ia32_vpdpbssds128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v4si __builtin_ia32_prolvd128(__gcc_v4si, __gcc_v4si)
__gcc_v16hf __builtin_ia32_sqrtph256(__gcc_v16hf)
__gcc_v8df __builtin_ia32_vpermilpd512(__gcc_v8df, int)
int __builtin_ia32_vcvtsh2si32(__gcc_v8hf, int)
__gcc_v8si __builtin_ia32_vplzcntd_256(__gcc_v8si)
__gcc_v4si __builtin_ia32_vpdpbuuds128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
char __builtin_ia32_vec_ext_v32qi(__gcc_v32qi, int)
void __builtin_ia32_storesh128_mask(__gcc_v8hf *, __gcc_v8hf, unsigned char)
__gcc_v4si __builtin_ia32_gatherq_d(__gcc_v4si, const int *, __gcc_v2di, __gcc_v4si, char)
__gcc_v8udi __builtin_ia32_vcvtph2uqq512_mask(__gcc_v8hf, __gcc_v8udi, unsigned char, int)
__gcc_v16sf __builtin_ia32_divps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v16si __builtin_ia32_vcvtph2dq512_mask(__gcc_v16hf, __gcc_v16si, unsigned short, int)
__gcc_v2df __builtin_ia32_rangesd128_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int, int)
__gcc_v4si __builtin_ia32_vpcomd(__gcc_v4si, __gcc_v4si, char)
__gcc_v32qi __builtin_ia32_vpmultishiftqb256(__gcc_v32qi, __gcc_v32qi)
__gcc_v16hi __builtin_ia32_permvarhi256(__gcc_v16hi, __gcc_v16hi)
__gcc_v4si __builtin_ia32_alignd128(__gcc_v4si, __gcc_v4si, int)
__gcc_v32hi __builtin_ia32_pmulhuw512(__gcc_v32hi, __gcc_v32hi)
void __builtin_ia32_aand64(void *, signed long long int)
__gcc_v8hi __builtin_ia32_vprotwi(__gcc_v8hi, char)
__gcc_v8di __builtin_ia32_psrav8di(__gcc_v8di, __gcc_v8di)
__gcc_v8si __builtin_ia32_prold256(__gcc_v8si, int)
__gcc_v32uhi __builtin_ia32_vcvttph2uw512_mask(__gcc_v32hf, __gcc_v32uhi, unsigned int, int)
__gcc_v16hf __builtin_ia32_minph256(__gcc_v16hf, __gcc_v16hf)
void __builtin_ia32_aadd32(void *, signed int)
__gcc_v16sf __builtin_ia32_permvarsf512(__gcc_v16sf, __gcc_v16si)
__gcc_v2df __builtin_ia32_rsqrt28sd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v8si __builtin_ia32_vpshrdvd256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v2df __builtin_ia32_getmantsd_round_mask(__gcc_v2df, __gcc_v2df, int, __gcc_v2df, unsigned char, int)
unsigned int __builtin_ia32_rdseed16_step(unsigned short *)
__gcc_v8hf __builtin_ia32_vcvtuqq2ph512_mask(__gcc_v8udi, __gcc_v8hf, unsigned char, int)
__gcc_v32hi __builtin_ia32_pshuflw512(__gcc_v32hi, int)
__gcc_v2df __builtin_ia32_rndscalesd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int, int)
__gcc_v8di __builtin_ia32_vpermi2varq512(__gcc_v8di, __gcc_v8di, __gcc_v8di)
__gcc_v4di __builtin_ia32_aesdeclast256(__gcc_v4di, __gcc_v4di)
__gcc_v4di __builtin_ia32_gatherq_q256(__gcc_v4di, const long long int *, __gcc_v4di, __gcc_v4di, char)
__gcc_v4df __builtin_ia32_gatherd_pd256(__gcc_v4df, const double *, __gcc_v4si, __gcc_v4df, char)
__gcc_v8hf __builtin_ia32_getexpsh128_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v2di __builtin_ia32_psraqi128(__gcc_v2di, int)
__gcc_v8di __builtin_ia32_vpshrdq512(__gcc_v8di, __gcc_v8di, int)
__gcc_v8hf __builtin_ia32_rndscaleph_128_mask(__gcc_v8hf, int, __gcc_v8hf, unsigned char)
void __builtin_ia32_tdpfp16ps(unsigned char, unsigned char, unsigned char)
__gcc_v4di __builtin_ia32_gatherd_q256(__gcc_v4di, const long long int *, __gcc_v4si, __gcc_v4di, char)
__gcc_v16sf __builtin_ia32_addps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v16hi __builtin_ia32_vpshldw256(__gcc_v16hi, __gcc_v16hi, int)
__gcc_v8hf __builtin_ia32_selectpbf_128(unsigned char, __gcc_v8hf, __gcc_v8hf)
__gcc_v2di __builtin_ia32_vpshrdvq128(__gcc_v2di, __gcc_v2di, __gcc_v2di)
__gcc_v2di __builtin_ia32_prorvq128(__gcc_v2di, __gcc_v2di)
void __builtin_ia32_aand32(void *, signed int)
__gcc_v16si __builtin_ia32_vpshldd512(__gcc_v16si, __gcc_v16si, int)
__gcc_v4si __builtin_ia32_vpermi2vard128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v32hi __builtin_ia32_vpshrdw512(__gcc_v32hi, __gcc_v32hi, int)
__gcc_v16sf __builtin_ia32_vpermilps512(__gcc_v16sf, int)
__gcc_v16sf __builtin_ia32_vfmulcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v8si __builtin_ia32_vpdpbsud256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v8hf __builtin_ia32_vcvtusi642sh(__gcc_v8hf, unsigned long long int, int)
_Float16 __builtin_ia32_reduce_fmin_ph256(__gcc_v16hf)
__gcc_v64qi __builtin_ia32_vpopcntb_512(__gcc_v64qi)
__gcc_v32hi __builtin_ia32_psrlw512(__gcc_v32hi, __gcc_v8hi)
__gcc_v32hf __builtin_ia32_vcvtuw2ph512_mask(__gcc_v32uhi, __gcc_v32hf, unsigned int, int)
__gcc_v2di __builtin_ia32_vpconflictdi_128(__gcc_v2di)
__gcc_v4sf __builtin_ia32_gatherd_ps(__gcc_v4sf, const float *, __gcc_v4si, __gcc_v4sf, char)
__gcc_v64qi __builtin_ia32_vpermi2varqi512(__gcc_v64qi, __gcc_v64qi, __gcc_v64qi)
__gcc_v2df __builtin_ia32_rcp28sd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v8di __builtin_ia32_prorq512(__gcc_v8di, int)
__gcc_v2di __builtin_ia32_prorq128(__gcc_v2di, int)
__gcc_v32hi __builtin_ia32_vpshrdvw512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi)
__gcc_v16sf __builtin_ia32_vfcmulcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
float __builtin_ia32_reduce_fmul_ps512(float, __gcc_v16sf)
__gcc_v16sf __builtin_ia32_vfmaddcph512_mask3(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v4sf __builtin_ia32_vcvtneeph2ps128(const __gcc_v8hf *)
__gcc_v8df __builtin_ia32_minpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v16hf __builtin_ia32_selectpbf_256(unsigned short, __gcc_v16hf, __gcc_v16hf)
__gcc_v4sf __builtin_ia32_rangess128_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int, int)
__gcc_v4si __builtin_ia32_vpshldd128(__gcc_v4si, __gcc_v4si, int)
__gcc_v64qi __builtin_ia32_pshufb512(__gcc_v64qi, __gcc_v64qi)
__gcc_v4si __builtin_ia32_vpdpwssd128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v4sf __builtin_ia32_vfmaddcsh_maskz(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v32hi __builtin_ia32_psllwi512(__gcc_v32hi, int)
__gcc_v4di __builtin_ia32_vpmadd52huq256(__gcc_v4di, __gcc_v4di, __gcc_v4di)
__gcc_v8hi __builtin_ia32_permvarhi128(__gcc_v8hi, __gcc_v8hi)
__gcc_v4sf __builtin_ia32_vfcmaddcsh_maskz(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v2di __builtin_ia32_vpmadd52luq128(__gcc_v2di, __gcc_v2di, __gcc_v2di)
__gcc_v32hi __builtin_ia32_pshufhw512(__gcc_v32hi, int)
__gcc_v4di __builtin_ia32_prorvq256(__gcc_v4di, __gcc_v4di)
__gcc_v16qi __builtin_ia32_vpmultishiftqb128(__gcc_v16qi, __gcc_v16qi)
__gcc_v8si __builtin_ia32_vpdpwssd256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v4sf __builtin_ia32_subss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v32qi __builtin_ia32_vpopcntb_256(__gcc_v32qi)
__gcc_v4si __builtin_ia32_vpdpbusd128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v8di __builtin_ia32_vpshldvq512(__gcc_v8di, __gcc_v8di, __gcc_v8di)
__gcc_v16hi __builtin_ia32_vpopcntw_256(__gcc_v16hi)
__gcc_v16hf __builtin_ia32_vfmaddph256(__gcc_v16hf, __gcc_v16hf, __gcc_v16hf)
__gcc_v32hf __builtin_ia32_scalefph512_mask(__gcc_v32hf, __gcc_v32hf, __gcc_v32hf, unsigned int, int)
float __builtin_ia32_reduce_fmax_ps512(__gcc_v16sf)
__gcc_v4di __builtin_ia32_vpconflictdi_256(__gcc_v4di)
__gcc_v16hi __builtin_ia32_vpermi2varhi256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi)
__gcc_v4si __builtin_ia32_vpopcntd_128(__gcc_v4si)
__gcc_v32hi __builtin_ia32_psrav32hi(__gcc_v32hi, __gcc_v32hi)
__gcc_v16si __builtin_ia32_vpshrdd512(__gcc_v16si, __gcc_v16si, int)
__gcc_v16sf __builtin_ia32_shuf_f32x4(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v16si __builtin_ia32_inserti32x4(__gcc_v16si, __gcc_v4si, int)
__gcc_v16qi __builtin_ia32_vprotbi(__gcc_v16qi, char)
__gcc_v64qi __builtin_ia32_permvarqi512(__gcc_v64qi, __gcc_v64qi)
__gcc_v8df __builtin_ia32_permvardf512(__gcc_v8df, __gcc_v8di)
__gcc_v16hf __builtin_ia32_maxph256(__gcc_v16hf, __gcc_v16hf)
__gcc_v8hi __builtin_ia32_vpcomw(__gcc_v8hi, __gcc_v8hi, char)
__gcc_v16usi __builtin_ia32_vcvtph2udq512_mask(__gcc_v16hf, __gcc_v16usi, unsigned short, int)
__gcc_v2df __builtin_ia32_scalefsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v32qi __builtin_ia32_vpermi2varqi256(__gcc_v32qi, __gcc_v32qi, __gcc_v32qi)
__gcc_v8di __builtin_ia32_aesenc512(__gcc_v8di, __gcc_v8di)
__gcc_v16si __builtin_ia32_vplzcntd_512(__gcc_v16si)
__gcc_v8sf __builtin_ia32_vcvtneobf162ps256(const __gcc_v16hf *)
__gcc_v16si __builtin_ia32_pslldi512(__gcc_v16si, int)
__gcc_v8si __builtin_ia32_vpdpbssds256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v2di __builtin_ia32_prolvq128(__gcc_v2di, __gcc_v2di)
__gcc_v8hf __builtin_ia32_selectsbf_128(unsigned char, __gcc_v8hf, __gcc_v8hf)
__gcc_v32qi __builtin_ia32_permvarqi256(__gcc_v32qi, __gcc_v32qi)
__gcc_v2di __builtin_ia32_vpshrdq128(__gcc_v2di, __gcc_v2di, int)
__gcc_v32hi __builtin_ia32_pmulhrsw512(__gcc_v32hi, __gcc_v32hi)
__gcc_v8hf __builtin_ia32_vcvtss2sh_round_mask(__gcc_v8hf, __gcc_v4sf, __gcc_v8hf, unsigned char, int)
__gcc_v4di __builtin_ia32_vpshrdq256(__gcc_v4di, __gcc_v4di, int)
__gcc_v256si __builtin_ia32_tdpfp16ps_internal(unsigned short, unsigned short, unsigned short, __gcc_v256si, __gcc_v256si, __gcc_v256si)
unsigned char __builtin_ia32_cmpph128_mask(__gcc_v8hf, __gcc_v8hf, int, unsigned char)
__gcc_v8hf __builtin_ia32_vcvtneps2bf16128(__gcc_v4sf)
_Float16 __builtin_ia32_reduce_fmul_ph512(_Float16, __gcc_v32hf)
__gcc_v8di __builtin_ia32_vplzcntq_512(__gcc_v8di)
__gcc_v16si __builtin_ia32_vpdpwssd512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v2di __builtin_ia32_vpermi2varq128(__gcc_v2di, __gcc_v2di, __gcc_v2di)
__gcc_v4si __builtin_ia32_vpcomud(__gcc_v4si, __gcc_v4si, char)
__gcc_v2di __builtin_ia32_prolq128(__gcc_v2di, int)
__gcc_v16si __builtin_ia32_vpopcntd_512(__gcc_v16si)
__gcc_v8hf __builtin_ia32_sqrtsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v16qi __builtin_ia32_vpcomb(__gcc_v16qi, __gcc_v16qi, char)
__gcc_v4si __builtin_ia32_vpdpbssd128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v16sf __builtin_ia32_vfmaddcph512_maskz(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v4sf __builtin_ia32_vfcmaddcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
void __builtin_ia32_compressstoreqi256_mask(__gcc_v32qi *, __gcc_v32qi, unsigned int)
_Float16 __builtin_ia32_reduce_fadd_ph512(_Float16, __gcc_v32hf)
__gcc_v2di __builtin_ia32_psravq128(__gcc_v2di, __gcc_v2di)
__gcc_v4sf __builtin_ia32_rsqrt28ss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
long long int __builtin_ia32_vcvtsh2si64(__gcc_v8hf, int)
__gcc_v8si __builtin_ia32_vpdpbusds256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v16sf __builtin_ia32_vcvtph2psx512_mask(__gcc_v16hf, __gcc_v16sf, unsigned short, int)
__gcc_v2di __builtin_ia32_vpshldvq128(__gcc_v2di, __gcc_v2di, __gcc_v2di)
__gcc_v8di __builtin_ia32_aesdeclast512(__gcc_v8di, __gcc_v8di)
__gcc_v16si __builtin_ia32_alignd512(__gcc_v16si, __gcc_v16si, int)
__gcc_v8df __builtin_ia32_subpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v16si __builtin_ia32_psrav16si(__gcc_v16si, __gcc_v16si)
__gcc_v8hf __builtin_ia32_vfmaddsubph(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf)
__gcc_v8hf __builtin_ia32_vcvtqq2ph512_mask(__gcc_v8di, __gcc_v8hf, unsigned char, int)
__gcc_v16si __builtin_ia32_vpdpbusds512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v16qi __builtin_ia32_vpcomub(__gcc_v16qi, __gcc_v16qi, char)
__gcc_v16hi __builtin_ia32_psrlv16hi(__gcc_v16hi, __gcc_v16hi)
__gcc_v4di __builtin_ia32_shuf_i64x2_256(__gcc_v4di, __gcc_v4di, int)
void __builtin_ia32_aor32(void *, signed int)
__gcc_v4sf __builtin_ia32_divss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v4sf __builtin_ia32_minss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v16si __builtin_ia32_psradi512(__gcc_v16si, int)
__gcc_v8di __builtin_ia32_vpshldq512(__gcc_v8di, __gcc_v8di, int)
__gcc_v8df __builtin_ia32_permdf512(__gcc_v8df, int)
void __builtin_ia32_invpcid(unsigned int, void *)
__gcc_v8df __builtin_ia32_maxpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v8di __builtin_ia32_psrlv8di(__gcc_v8di, __gcc_v8di)
_Float16 __builtin_ia32_reduce_fmul_ph128(_Float16, __gcc_v8hf)
__gcc_v4di __builtin_ia32_selectq_256(unsigned char, __gcc_v4di, __gcc_v4di)
__gcc_v8df __builtin_ia32_addpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v16sf __builtin_ia32_maxps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v2df __builtin_ia32_loadsd128_mask(const __gcc_v2df *, __gcc_v2df, unsigned char)
__gcc_v2di __builtin_ia32_gatherd_q(__gcc_v2di, const long long int *, __gcc_v4si, __gcc_v2di, char)
void __builtin_ia32_aadd64(void *, signed long long int)
__gcc_v8si __builtin_ia32_vpshldvd256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v4df __builtin_ia32_shuf_f64x2_256(__gcc_v4df, __gcc_v4df, int)
__gcc_v4sf __builtin_ia32_gatherq_ps256(__gcc_v4sf, const float *, __gcc_v4di, __gcc_v4sf, char)
__gcc_v8hf __builtin_ia32_mulsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v8si __builtin_ia32_vpdpbsuds256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v32qi __builtin_ia32_vec_set_v32qi(__gcc_v32qi, char, int)
__gcc_v16sf __builtin_ia32_vfcmaddcph512_mask(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v8di __builtin_ia32_permdi512(__gcc_v8di, int)
__gcc_v64qi __builtin_ia32_vpmultishiftqb512(__gcc_v64qi, __gcc_v64qi)
__gcc_v2di __builtin_ia32_vpmadd52huq128(__gcc_v2di, __gcc_v2di, __gcc_v2di)
__gcc_v8di __builtin_ia32_vcvtph2qq512_mask(__gcc_v8hf, __gcc_v8di, unsigned char, int)
long long int __builtin_ia32_vcvttsh2si64(__gcc_v8hf, int)
__gcc_v4di __builtin_ia32_psraq256(__gcc_v4di, __gcc_v2di)
__gcc_v8hf __builtin_ia32_divsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
unsigned int __builtin_ia32_rdseed32_step(unsigned int *)
__gcc_v8di __builtin_ia32_prolq512(__gcc_v8di, int)
__gcc_v32hi __builtin_ia32_vcvttph2w512_mask(__gcc_v32hf, __gcc_v32hi, unsigned int, int)
__gcc_v4si __builtin_ia32_prold128(__gcc_v4si, int)
__gcc_v8hi __builtin_ia32_psrlv8hi(__gcc_v8hi, __gcc_v8hi)
__gcc_v8di __builtin_ia32_pslldqi512_byteshift(__gcc_v8di, int)
__gcc_v16sf __builtin_ia32_vfcmaddcph512_mask3(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v2di __builtin_ia32_vpcomq(__gcc_v2di, __gcc_v2di, char)
__gcc_v4sf __builtin_ia32_vbcstnesh2ps128(const _Float16 *)
__gcc_v8sf __builtin_ia32_shuf_f32x4_256(__gcc_v8sf, __gcc_v8sf, int)
_Float16 __builtin_ia32_reduce_fmin_ph512(__gcc_v32hf)
__gcc_v4si __builtin_ia32_vpdpbuud128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
unsigned int __builtin_ia32_rdseed64_step(unsigned long long int *)
__gcc_v8si __builtin_ia32_vpdpbuuds256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v8hf __builtin_ia32_loadsh128_mask(const __gcc_v8hf *, __gcc_v8hf, unsigned char)
__gcc_v16hi __builtin_ia32_psrav16hi(__gcc_v16hi, __gcc_v16hi)
__gcc_v8hf __builtin_ia32_rndscalesh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int, int)
__gcc_v16usi __builtin_ia32_vcvttph2udq512_mask(__gcc_v16hf, __gcc_v16usi, unsigned short, int)
__gcc_v8di __builtin_ia32_vpconflictdi_512(__gcc_v8di)
__gcc_v8hf __builtin_ia32_addsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v32hf __builtin_ia32_selectpbf_512(unsigned int, __gcc_v32hf, __gcc_v32hf)
float __builtin_ia32_reduce_fmin_ps512(__gcc_v16sf)
__gcc_v16si __builtin_ia32_vpdpwssds512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v8si __builtin_ia32_inserti32x4_256(__gcc_v8si, __gcc_v4si, int)
__gcc_v8di __builtin_ia32_psllv8di(__gcc_v8di, __gcc_v8di)
__gcc_v4sf __builtin_ia32_vfmaddcsh_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v16qi __builtin_ia32_permvarqi128(__gcc_v16qi, __gcc_v16qi)
__gcc_v4sf __builtin_ia32_vcvtneobf162ps128(const __gcc_v8hf *)
__gcc_v8si __builtin_ia32_vpconflictsi_256(__gcc_v8si)
__gcc_v32hi __builtin_ia32_pmulhw512(__gcc_v32hi, __gcc_v32hi)
__gcc_v8hi __builtin_ia32_vpshrdw128(__gcc_v8hi, __gcc_v8hi, int)
short __builtin_ia32_vec_ext_v16hi(__gcc_v16hi, int)
__gcc_v32hi __builtin_ia32_permvarhi512(__gcc_v32hi, __gcc_v32hi)
__gcc_v8sf __builtin_ia32_vbcstnebf162ps256(const _Float16 *)
__gcc_v16hi __builtin_ia32_vpshrdvw256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi)
__gcc_v4di __builtin_ia32_vpopcntq_256(__gcc_v4di)
__gcc_v8di __builtin_ia32_permvardi512(__gcc_v8di, __gcc_v8di)
__gcc_v8hf __builtin_ia32_selectsh_128(unsigned char, __gcc_v8hf, __gcc_v8hf)
__gcc_v32hf __builtin_ia32_addph512(__gcc_v32hf, __gcc_v32hf, int)
__gcc_v4si __builtin_ia32_gatherq_d256(__gcc_v4si, const int *, __gcc_v4di, __gcc_v4si, char)
__gcc_v8di __builtin_ia32_psraqi512(__gcc_v8di, int)
__gcc_v4sf __builtin_ia32_vfmulcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v16sf __builtin_ia32_subps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v2df __builtin_ia32_getexpsd128_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v4sf __builtin_ia32_vbcstnebf162ps128(const _Float16 *)
__gcc_v4si __builtin_ia32_vpconflictsi_128(__gcc_v4si)
_Float16 __builtin_ia32_reduce_fmax_ph512(__gcc_v32hf)
__gcc_v16si __builtin_ia32_psrad512(__gcc_v16si, __gcc_v4si)
__gcc_v32hi __builtin_ia32_packssdw512(__gcc_v16si, __gcc_v16si)
__gcc_v8di __builtin_ia32_vpmadd52huq512(__gcc_v8di, __gcc_v8di, __gcc_v8di)
unsigned long long int __builtin_ia32_vcvttsh2usi64(__gcc_v8hf, int)
__gcc_v8sf __builtin_ia32_gatherd_ps256(__gcc_v8sf, const float *, __gcc_v8si, __gcc_v8sf, char)
__gcc_v8hf __builtin_ia32_maxsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v64qi __builtin_ia32_pavgb512(__gcc_v64qi, __gcc_v64qi)
__gcc_v8df __builtin_ia32_divpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v16hi __builtin_ia32_vpshldvw256(__gcc_v16hi, __gcc_v16hi, __gcc_v16hi)
__gcc_v4sf __builtin_ia32_rcp28ss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
unsigned short __builtin_ia32_cmpph256_mask(__gcc_v16hf, __gcc_v16hf, int, unsigned short)
__gcc_v2df __builtin_ia32_divsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v4di __builtin_ia32_vec_set_v4di(__gcc_v4di, long long int, int)
__gcc_v2df __builtin_ia32_minsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v32hf __builtin_ia32_divph512(__gcc_v32hf, __gcc_v32hf, int)
__gcc_v8di __builtin_ia32_inserti64x2_512(__gcc_v8di, __gcc_v2di, int)
__gcc_v8di __builtin_ia32_psllqi512(__gcc_v8di, int)
void __builtin_ia32_writeeflags_u32(unsigned int)
__gcc_v8di __builtin_ia32_prolvq512(__gcc_v8di, __gcc_v8di)
signed int __builtin_ia32_cmpccxadd32(void *, signed int, signed int, int)
__gcc_v8hi __builtin_ia32_vpshrdvw128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi)
__gcc_v4di __builtin_ia32_vpshldvq256(__gcc_v4di, __gcc_v4di, __gcc_v4di)
__gcc_v16sf __builtin_ia32_minps512(__gcc_v16sf, __gcc_v16sf, int)
__gcc_v8hi __builtin_ia32_vpopcntw_128(__gcc_v8hi)
__gcc_v16si __builtin_ia32_inserti32x8(__gcc_v16si, __gcc_v8si, int)
__gcc_v4di __builtin_ia32_prorq256(__gcc_v4di, int)
__gcc_v32hi __builtin_ia32_packusdw512(__gcc_v16si, __gcc_v16si)
__gcc_v2df __builtin_ia32_gatherq_pd(__gcc_v2df, const double *, __gcc_v2di, __gcc_v2df, char)
unsigned long long int __builtin_ia32_rdpru(int)
__gcc_v32hi __builtin_ia32_psrlv32hi(__gcc_v32hi, __gcc_v32hi)
__gcc_v32hf __builtin_ia32_minph512(__gcc_v32hf, __gcc_v32hf, int)
__gcc_v16si __builtin_ia32_psrlv16si(__gcc_v16si, __gcc_v16si)
__gcc_v8hf __builtin_ia32_reducesh_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int, int)
void __builtin_ia32_directstore_u64(unsigned long int *, unsigned long int)
__gcc_v16sf __builtin_ia32_vfcmaddcph512_maskz(__gcc_v16sf, __gcc_v16sf, __gcc_v16sf, unsigned short, int)
__gcc_v2df __builtin_ia32_maxsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v32hi __builtin_ia32_dbpsadbw512(__gcc_v64qi, __gcc_v64qi, int)
__gcc_v8df __builtin_ia32_insertf64x2_512(__gcc_v8df, __gcc_v2df, int)
__gcc_v16si __builtin_ia32_prold512(__gcc_v16si, int)
__gcc_v8df __builtin_ia32_vpermilvarpd512(__gcc_v8df, __gcc_v8di)
__gcc_v2di __builtin_ia32_vpcomuq(__gcc_v2di, __gcc_v2di, char)
__gcc_v8hf __builtin_ia32_scalefsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
__gcc_v32hi __builtin_ia32_psrawi512(__gcc_v32hi, int)
__gcc_v2di __builtin_ia32_pslldqi128_byteshift(__gcc_v2di, int)
__gcc_v8si __builtin_ia32_vpdpwssds256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v16si __builtin_ia32_vcvttph2dq512_mask(__gcc_v16hf, __gcc_v16si, unsigned short, int)
__gcc_v64qi __builtin_ia32_packuswb512(__gcc_v32hi, __gcc_v32hi)
_Float16 __builtin_ia32_reduce_fmin_ph128(__gcc_v8hf)
__gcc_v16sf __builtin_ia32_vpermilvarps512(__gcc_v16sf, __gcc_v16si)
void __builtin_ia32_vp2intersect_q_256(__gcc_v4di, __gcc_v4di, unsigned char *, unsigned char *)
__gcc_v16hf __builtin_ia32_vcvtdq2ph512_mask(__gcc_v16si, __gcc_v16hf, unsigned short, int)
__gcc_v4sf __builtin_ia32_vfmaddcsh_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v32hi __builtin_ia32_vcvtph2w512_mask(__gcc_v32hf, __gcc_v32hi, unsigned int, int)
__gcc_v16hi __builtin_ia32_vec_set_v16hi(__gcc_v16hi, short, int)
void __builtin_ia32_vp2intersect_q_512(__gcc_v8di, __gcc_v8di, unsigned char *, unsigned char *)
__gcc_v8df __builtin_ia32_shufpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v4sf __builtin_ia32_rndscaless_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int, int)
__gcc_v4si __builtin_ia32_vplzcntd_128(__gcc_v4si)
__gcc_v16si __builtin_ia32_psrld512(__gcc_v16si, __gcc_v4si)
__gcc_v8hi __builtin_ia32_dbpsadbw128(__gcc_v16qi, __gcc_v16qi, int)
__gcc_v4di __builtin_ia32_vpshldq256(__gcc_v4di, __gcc_v4di, int)
__gcc_v4sf __builtin_ia32_vfcmaddcsh_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v8si __builtin_ia32_shuf_i32x4_256(__gcc_v8si, __gcc_v8si, int)
__gcc_v4si __builtin_ia32_vpdpbsud128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v8sf __builtin_ia32_vcvtneeph2ps256(const __gcc_v16hf *)
__gcc_v2df __builtin_ia32_vpermi2varpd128(__gcc_v2df, __gcc_v2di, __gcc_v2df)
__gcc_v4si __builtin_ia32_vpdpwssds128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v4sf __builtin_ia32_loadss128_mask(const __gcc_v4sf *, __gcc_v4sf, unsigned char)
__gcc_v16hf __builtin_ia32_vfmaddsubph256(__gcc_v16hf, __gcc_v16hf, __gcc_v16hf)
__gcc_v8sf __builtin_ia32_vcvtneebf162ps256(const __gcc_v16hf *)
__gcc_v8di __builtin_ia32_vpmadd52luq512(__gcc_v8di, __gcc_v8di, __gcc_v8di)
__gcc_v16si __builtin_ia32_pshufd512(__gcc_v16si, int)
__gcc_v8si __builtin_ia32_vpermi2vard256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v16si __builtin_ia32_vpshrdvd512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v4si __builtin_ia32_vpshldvd128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v16sf __builtin_ia32_insertf32x8(__gcc_v16sf, __gcc_v8sf, int)
__gcc_v8di __builtin_ia32_psraq512(__gcc_v8di, __gcc_v2di)
__gcc_v4di __builtin_ia32_psraqi256(__gcc_v4di, int)
__gcc_v4di __builtin_ia32_aesenc256(__gcc_v4di, __gcc_v4di)
__gcc_v8si __builtin_ia32_prolvd256(__gcc_v8si, __gcc_v8si)
__gcc_v4di __builtin_ia32_alignq256(__gcc_v4di, __gcc_v4di, int)
void __builtin_ia32_aor64(void *, signed long long int)
__gcc_v4sf __builtin_ia32_vcvtneebf162ps128(const __gcc_v8hf *)
__gcc_v8hf __builtin_ia32_minph128(__gcc_v8hf, __gcc_v8hf)
__gcc_v8di __builtin_ia32_pmuludq512(__gcc_v16si, __gcc_v16si)
__gcc_v32hf __builtin_ia32_selectph_512(unsigned int, __gcc_v32hf, __gcc_v32hf)
__gcc_v8hi __builtin_ia32_vpshldw128(__gcc_v8hi, __gcc_v8hi, int)
__gcc_v8hf __builtin_ia32_vcvtpd2ph512_mask(__gcc_v8df, __gcc_v8hf, unsigned char, int)
__gcc_v8sf __builtin_ia32_vcvtneoph2ps256(const __gcc_v16hf *)
__gcc_v32hf __builtin_ia32_sqrtph512(__gcc_v32hf, int)
__gcc_v2di __builtin_ia32_gatherq_q(__gcc_v2di, const long long int *, __gcc_v2di, __gcc_v2di, char)
void __builtin_ia32_compressstorehi512_mask(__gcc_v32hi *, __gcc_v32hi, unsigned int)
__gcc_v32hi __builtin_ia32_psraw512(__gcc_v32hi, __gcc_v8hi)
__gcc_v8di __builtin_ia32_psrlqi512(__gcc_v8di, int)
__gcc_v8di __builtin_ia32_psrlq512(__gcc_v8di, __gcc_v2di)
__gcc_v4sf __builtin_ia32_addss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v8si __builtin_ia32_vpshrdd256(__gcc_v8si, __gcc_v8si, int)
__gcc_v8hi __builtin_ia32_vpcomuw(__gcc_v8hi, __gcc_v8hi, char)
__gcc_v4si __builtin_ia32_vpdpbsuds128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v4df __builtin_ia32_permvardf256(__gcc_v4df, __gcc_v4di)
double __builtin_ia32_reduce_fmul_pd512(double, __gcc_v8df)
__gcc_v4sf __builtin_ia32_getmantss_round_mask(__gcc_v4sf, __gcc_v4sf, int, __gcc_v4sf, unsigned char, int)
__gcc_v8hf __builtin_ia32_sqrtph(__gcc_v8hf)
__gcc_v8df __builtin_ia32_shuf_f64x2(__gcc_v8df, __gcc_v8df, int)
__gcc_v4si __builtin_ia32_vpdpbusds128(__gcc_v4si, __gcc_v4si, __gcc_v4si)
__gcc_v16hf __builtin_ia32_vcvtudq2ph512_mask(__gcc_v16usi, __gcc_v16hf, unsigned short, int)
__gcc_v32hi __builtin_ia32_vpshldw512(__gcc_v32hi, __gcc_v32hi, int)
__gcc_v4sf __builtin_ia32_scalefss_round_mask(__gcc_v4sf, __gcc_v4sf, __gcc_v4sf, unsigned char, int)
__gcc_v16si __builtin_ia32_vpshldvd512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v8di __builtin_ia32_shuf_i64x2(__gcc_v8di, __gcc_v8di, int)
__gcc_v16si __builtin_ia32_permvarsi512(__gcc_v16si, __gcc_v16si)
__gcc_v16hf __builtin_ia32_rndscaleph_256_mask(__gcc_v16hf, int, __gcc_v16hf, unsigned short)
__gcc_v8df __builtin_ia32_vcvtph2pd512_mask(__gcc_v8hf, __gcc_v8df, unsigned char, int)
__gcc_v16si __builtin_ia32_psrldi512(__gcc_v16si, int)
unsigned int __builtin_ia32_vcvtsh2usi32(__gcc_v8hf, int)
__gcc_v32hf __builtin_ia32_subph512(__gcc_v32hf, __gcc_v32hf, int)
__gcc_v8di __builtin_ia32_prorvq512(__gcc_v8di, __gcc_v8di)
int __builtin_ia32_vcomish(__gcc_v8hf, __gcc_v8hf, int, int)
__gcc_v2di __builtin_ia32_vpshldq128(__gcc_v2di, __gcc_v2di, int)
__gcc_v32hf __builtin_ia32_mulph512(__gcc_v32hf, __gcc_v32hf, int)
_Float16 __builtin_ia32_reduce_fmax_ph256(__gcc_v16hf)
__gcc_v16si __builtin_ia32_pslld512(__gcc_v16si, __gcc_v4si)
__gcc_v16hf __builtin_ia32_vcvtps2phx512_mask(__gcc_v16sf, __gcc_v16hf, unsigned short, int)
__gcc_v8si __builtin_ia32_vpshldd256(__gcc_v8si, __gcc_v8si, int)
void __builtin_ia32_compressstorehi256_mask(__gcc_v16hi *, __gcc_v16hi, unsigned short)
unsigned char __builtin_ia32_cmpsh_mask(__gcc_v8hf, __gcc_v8hf, int, unsigned char, int)
__gcc_v4di __builtin_ia32_prolvq256(__gcc_v4di, __gcc_v4di)
__gcc_v2df __builtin_ia32_subsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
void __builtin_ia32_compressstoreqi512_mask(__gcc_v64qi *, __gcc_v64qi, unsigned long long int)
__gcc_v16si __builtin_ia32_prord512(__gcc_v16si, int)
__gcc_v4df __builtin_ia32_vpermi2varpd256(__gcc_v4df, __gcc_v4di, __gcc_v4df)
__gcc_v8di __builtin_ia32_pmuldq512(__gcc_v16si, __gcc_v16si)
__gcc_v8hi __builtin_ia32_vpermi2varhi128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi)
__gcc_v8di __builtin_ia32_vpshrdvq512(__gcc_v8di, __gcc_v8di, __gcc_v8di)
__gcc_v16hi __builtin_ia32_dbpsadbw256(__gcc_v32qi, __gcc_v32qi, int)
__gcc_v8df __builtin_ia32_mulpd512(__gcc_v8df, __gcc_v8df, int)
__gcc_v8di __builtin_ia32_vpopcntq_512(__gcc_v8di)
__gcc_v4di __builtin_ia32_pslldqi256_byteshift(__gcc_v4di, int)
__gcc_v16si __builtin_ia32_vpdpbusd512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
__gcc_v4di __builtin_ia32_pclmulqdq256(__gcc_v4di, __gcc_v4di, char)
__gcc_v32hi __builtin_ia32_pavgw512(__gcc_v32hi, __gcc_v32hi)
__gcc_v16si __builtin_ia32_vpermi2vard512(__gcc_v16si, __gcc_v16si, __gcc_v16si)
void __builtin_ia32_storesd128_mask(__gcc_v2df *, __gcc_v2df, unsigned char)
__gcc_v16si __builtin_ia32_shuf_i32x4(__gcc_v16si, __gcc_v16si, int)
__gcc_v32hi __builtin_ia32_vpermi2varhi512(__gcc_v32hi, __gcc_v32hi, __gcc_v32hi)
__gcc_v16si __builtin_ia32_prorvd512(__gcc_v16si, __gcc_v16si)
void __builtin_ia32_axor32(void *, signed int)
void __builtin_ia32_directstore_u32(unsigned int *, unsigned int)
__gcc_v4di __builtin_ia32_aesenclast256(__gcc_v4di, __gcc_v4di)
__gcc_v32hi __builtin_ia32_vpopcntw_512(__gcc_v32hi)
__gcc_v4sf __builtin_ia32_vcvtneoph2ps128(const __gcc_v8hf *)
__gcc_v8si __builtin_ia32_vec_set_v8si(__gcc_v8si, int, int)
__gcc_v8hf __builtin_ia32_subsh_round_mask(__gcc_v8hf, __gcc_v8hf, __gcc_v8hf, unsigned char, int)
void __builtin_ia32_prefetchi(const void *, unsigned int)
__gcc_v32hf __builtin_ia32_rndscaleph_mask(__gcc_v32hf, int, __gcc_v32hf, unsigned int, int)
__gcc_v16hi __builtin_ia32_psllv16hi(__gcc_v16hi, __gcc_v16hi)
__gcc_v8df __builtin_ia32_vpermi2varpd512(__gcc_v8df, __gcc_v8di, __gcc_v8df)
__gcc_v8si __builtin_ia32_prord256(__gcc_v8si, int)
__gcc_v2df __builtin_ia32_sqrtsd_round_mask(__gcc_v2df, __gcc_v2df, __gcc_v2df, unsigned char, int)
__gcc_v8hi __builtin_ia32_vpshldvw128(__gcc_v8hi, __gcc_v8hi, __gcc_v8hi)
__gcc_v16qi __builtin_ia32_vpermi2varqi128(__gcc_v16qi, __gcc_v16qi, __gcc_v16qi)
signed long long int __builtin_ia32_cmpccxadd64(void *, signed long long int, signed long long int, int)
__gcc_v8si __builtin_ia32_gatherd_d256(__gcc_v8si, const int *, __gcc_v8si, __gcc_v8si, char)
int __builtin_ia32_vcvttsh2si32(__gcc_v8hf, int)
__gcc_v16si __builtin_ia32_prolvd512(__gcc_v16si, __gcc_v16si)
__gcc_v8si __builtin_ia32_vpdpbssd256(__gcc_v8si, __gcc_v8si, __gcc_v8si)
__gcc_v2df __builtin_ia32_gatherd_pd(__gcc_v2df, const double *, __gcc_v4si, __gcc_v2df, char)
void __builtin_ia32_axor64(void *, signed long long int)
__gcc_v8di __builtin_ia32_pclmulqdq512(__gcc_v8di, __gcc_v8di, char)
__gcc_v16sf __builtin_ia32_mulps512(__gcc_v16sf, __gcc_v16sf, int)