24 #error "Never use <avx512fintrin.h> directly; include <immintrin.h> instead."
27 #ifndef __AVX512FINTRIN_H
28 #define __AVX512FINTRIN_H
/* 64-byte vector of long long elements. Used throughout this header as the
   cast target when handing __m512i values to builtins such as
   __builtin_ia32_pandq512_mask. */
32 typedef long long __v8di
__attribute__((__vector_size__(64)));
/* 64-byte integer vector type; it is the parameter and return type of the
   integer intrinsics declared in this header. */
37 typedef long long __m512i
__attribute__((__vector_size__(64)));
/* Rounding-control selectors. _MM_FROUND_CUR_DIRECTION is the value the
   non-"_round" macros in this header (for example _mm512_roundscale_ps and
   _mm512_cmp_ps_mask) pass as the trailing rounding argument.
   NOTE(review): the names suggest nearest / toward -inf / toward +inf /
   toward zero / "use the current rounding mode"; confirm the encodings
   against the Intel SDM before changing any value. */
43 #define _MM_FROUND_TO_NEAREST_INT 0x00
44 #define _MM_FROUND_TO_NEG_INF 0x01
45 #define _MM_FROUND_TO_POS_INF 0x02
46 #define _MM_FROUND_TO_ZERO 0x03
47 #define _MM_FROUND_CUR_DIRECTION 0x04
/* Attribute set attached to the inline intrinsic definitions in this header:
   always_inline plus nodebug. The macro is #undef'd again near the end of the
   header. */
50 #define __DEFAULT_FN_ATTRS __attribute__((__always_inline__, __nodebug__))
57 return (__m512i)(__v8di){ 0, 0, 0, 0, 0, 0, 0, 0 };
63 return (__m512i) __builtin_ia32_pbroadcastd512_gpr_mask (__A,
73 return (__m512i) __builtin_ia32_pbroadcastq512_gpr_mask (__A,
78 return (__m512i) __builtin_ia32_pbroadcastq512_mem_mask (__A,
88 return (__m512){ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
89 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
94 return (__m512d){ 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
100 return (__m512){ __w, __w, __w, __w, __w, __w, __w, __w,
101 __w, __w, __w, __w, __w, __w, __w, __w };
107 return (__m512d){ __w, __w, __w, __w, __w, __w, __w, __w };
113 return (__m512i)(__v16si){ __s, __s, __s, __s, __s, __s, __s, __s,
114 __s, __s, __s, __s, __s, __s, __s, __s };
120 return (__m512i)(__v8di){ __d, __d, __d, __d, __d, __d, __d, __d };
127 return (__v16sf){ __f, __f, __f, __f,
130 __f, __f, __f, __f };
137 return (__v8df){ __d, __d, __d, __d,
138 __d, __d, __d, __d };
146 return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, -1, -1, -1, -1);
152 return __builtin_shufflevector(__a, __a, 0, 1, 2, 3, 4, 5, 6, 7,
153 -1, -1, -1, -1, -1, -1, -1, -1);
159 return __builtin_shufflevector(__a, __a, 0, 1);
165 return __builtin_shufflevector(__a, __a, 0, 1, 2, 3);
178 return (__m512i) __builtin_ia32_pandd512_mask((__v16si) __a,
186 return (__m512i) __builtin_ia32_pandd512_mask((__v16si) __a,
202 return (__m512i) __builtin_ia32_pandq512_mask ((__v8di) __a,
210 return (__m512i) __builtin_ia32_pandq512_mask ((__v8di) __a,
220 return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
230 return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
239 return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
249 return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
259 return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
267 return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
282 return (__m512i) __builtin_ia32_pord512_mask((__v16si) __a,
290 return (__m512i) __builtin_ia32_pord512_mask((__v16si) __a,
306 return (__m512i) __builtin_ia32_porq512_mask ((__v8di) __a,
314 return (__m512i) __builtin_ia32_porq512_mask ((__v8di) __a,
330 return (__m512i) __builtin_ia32_pxord512_mask((__v16si) __a,
338 return (__m512i) __builtin_ia32_pxord512_mask((__v16si) __a,
354 return (__m512i) __builtin_ia32_pxorq512_mask ((__v8di) __a,
362 return (__m512i) __builtin_ia32_pxorq512_mask ((__v8di) __a,
427 return (__m512i) ((__v8di) __A + (__v8di) __B);
433 return (__m512i) __builtin_ia32_paddq512_mask ((__v8di) __A,
442 return (__m512i) __builtin_ia32_paddq512_mask ((__v8di) __A,
452 return (__m512i) ((__v8di) __A - (__v8di) __B);
458 return (__m512i) __builtin_ia32_psubq512_mask ((__v8di) __A,
467 return (__m512i) __builtin_ia32_psubq512_mask ((__v8di) __A,
477 return (__m512i) ((__v16si) __A + (__v16si) __B);
483 return (__m512i) __builtin_ia32_paddd512_mask ((__v16si) __A,
492 return (__m512i) __builtin_ia32_paddd512_mask ((__v16si) __A,
502 return (__m512i) ((__v16si) __A - (__v16si) __B);
508 return (__m512i) __builtin_ia32_psubd512_mask ((__v16si) __A,
517 return (__m512i) __builtin_ia32_psubd512_mask ((__v16si) __A,
527 return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A,
538 return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A,
546 static __inline __m512i
550 return (__m512i) __builtin_ia32_pmaxsd512_mask ((__v16si) __A,
560 return (__m512i) __builtin_ia32_pmaxud512_mask ((__v16si) __A,
570 return (__m512i) __builtin_ia32_pmaxsq512_mask ((__v8di) __A,
580 return (__m512i) __builtin_ia32_pmaxuq512_mask ((__v8di) __A,
590 return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A,
601 return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A,
609 static __inline __m512i
613 return (__m512i) __builtin_ia32_pminsd512_mask ((__v16si) __A,
623 return (__m512i) __builtin_ia32_pminud512_mask ((__v16si) __A,
633 return (__m512i) __builtin_ia32_pminsq512_mask ((__v8di) __A,
643 return (__m512i) __builtin_ia32_pminuq512_mask ((__v8di) __A,
653 return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
663 return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
671 return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
681 return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
691 return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
699 return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
709 return (__m512i) ((__v16si) __A * (__v16si) __B);
715 return (__m512i) __builtin_ia32_pmulld512_mask ((__v16si) __A,
725 return (__m512i) __builtin_ia32_pmulld512_mask ((__v16si) __A,
733 return (__m512d)__builtin_ia32_sqrtpd512_mask((__v8df)a,
742 return (__m512)__builtin_ia32_sqrtps512_mask((__v16sf)a,
751 return (__m512d) __builtin_ia32_rsqrt14pd512_mask ((__v8df) __A,
759 return (__m512) __builtin_ia32_rsqrt14ps512_mask ((__v16sf) __A,
768 return (__m128) __builtin_ia32_rsqrt14ss_mask ((__v4sf) __A,
778 return (__m128d) __builtin_ia32_rsqrt14sd_mask ((__v2df) __A,
788 return (__m512d) __builtin_ia32_rcp14pd512_mask ((__v8df) __A,
797 return (__m512) __builtin_ia32_rcp14ps512_mask ((__v16sf) __A,
805 return (__m128) __builtin_ia32_rcp14ss_mask ((__v4sf) __A,
815 return (__m128d) __builtin_ia32_rcp14sd_mask ((__v2df) __A,
825 return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
834 return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A,
843 return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
852 return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A,
861 return (__m512i) __builtin_ia32_pabsq512_mask ((__v8di) __A,
870 return (__m512i) __builtin_ia32_pabsd512_mask ((__v16si) __A,
/* Apply the round-scale builtin to the 16-float vector A.
 *
 *   A - source vector. It is captured in a local so that it is evaluated
 *       exactly once, even though the builtin needs it twice (as the operand
 *       and as the pass-through value). The local has a deliberately long
 *       name so it cannot shadow a caller's own __A / __a variable.
 *   B - control operand, forwarded unchanged to the builtin.
 *
 * The write mask is all-ones (every lane enabled) and the rounding argument
 * is _MM_FROUND_CUR_DIRECTION. The result has type __m512.
 */
#define _mm512_roundscale_ps(A, B) __extension__ ({ \
  __m512 __roundscale_ps_src = (__m512)(A); \
  (__m512)__builtin_ia32_rndscaleps_mask((__v16sf)__roundscale_ps_src, (B), \
                                         (__v16sf)__roundscale_ps_src, \
                                         (__mmask16)-1, \
                                         _MM_FROUND_CUR_DIRECTION); })
/* Apply the round-scale builtin to the 8-double vector A.
 *
 *   A - source vector. It is captured in a local so that it is evaluated
 *       exactly once, even though the builtin needs it twice (as the operand
 *       and as the pass-through value). The local has a deliberately long
 *       name so it cannot shadow a caller's own __A / __a variable.
 *   B - control operand, forwarded unchanged to the builtin.
 *
 * The write mask is all-ones (every lane enabled) and the rounding argument
 * is _MM_FROUND_CUR_DIRECTION. The result has type __m512d.
 */
#define _mm512_roundscale_pd(A, B) __extension__ ({ \
  __m512d __roundscale_pd_src = (__m512d)(A); \
  (__m512d)__builtin_ia32_rndscalepd_mask((__v8df)__roundscale_pd_src, (B), \
                                          (__v8df)__roundscale_pd_src, \
                                          (__mmask8)-1, \
                                          _MM_FROUND_CUR_DIRECTION); })
/* fmadd on 8 x double with an explicit rounding argument R. A, B and C reach
   the builtin unmodified; the four variants differ only in the builtin suffix
   and in where the mask comes from. Mind the differing argument orders:
   (A, B, C, R), (A, U, B, C, R), (A, B, C, U, R) and (U, A, B, C, R).
   NOTE(review): how each builtin suffix treats masked-off lanes is not
   visible in this file - confirm against the Intel Intrinsics Guide. */
/* Unmasked form: _mask builtin with an all-ones __mmask8. */
884 #define _mm512_fmadd_round_pd(A, B, C, R) __extension__ ({ \
885 (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) (A), \
886 (__v8df) (B), (__v8df) (C), \
887 (__mmask8) -1, (R)); })
/* Masked form: same _mask builtin, caller-supplied mask U. */
890 #define _mm512_mask_fmadd_round_pd(A, U, B, C, R) __extension__ ({ \
891 (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) (A), \
892 (__v8df) (B), (__v8df) (C), \
893 (__mmask8) (U), (R)); })
/* mask3 form: _mask3 builtin, mask U given after the three operands. */
896 #define _mm512_mask3_fmadd_round_pd(A, B, C, U, R) __extension__ ({ \
897 (__m512d) __builtin_ia32_vfmaddpd512_mask3 ((__v8df) (A), \
898 (__v8df) (B), (__v8df) (C), \
899 (__mmask8) (U), (R)); })
/* maskz form: _maskz builtin, mask U given before the three operands. */
902 #define _mm512_maskz_fmadd_round_pd(U, A, B, C, R) __extension__ ({ \
903 (__m512d) __builtin_ia32_vfmaddpd512_maskz ((__v8df) (A), \
904 (__v8df) (B), (__v8df) (C), \
905 (__mmask8) (U), (R)); })
/* fmsub on 8 x double with rounding argument R. There is no separate builtin
   used here: each macro calls the vfmaddpd512 builtin with C negated. */
/* Unmasked form: _mask builtin, all-ones __mmask8, C negated. */
908 #define _mm512_fmsub_round_pd(A, B, C, R) __extension__ ({ \
909 (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) (A), \
910 (__v8df) (B), -(__v8df) (C), \
911 (__mmask8) -1, (R)); })
/* Masked form: _mask builtin, caller-supplied mask U, C negated. */
914 #define _mm512_mask_fmsub_round_pd(A, U, B, C, R) __extension__ ({ \
915 (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) (A), \
916 (__v8df) (B), -(__v8df) (C), \
917 (__mmask8) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, C negated. */
920 #define _mm512_maskz_fmsub_round_pd(U, A, B, C, R) __extension__ ({ \
921 (__m512d) __builtin_ia32_vfmaddpd512_maskz ((__v8df) (A), \
922 (__v8df) (B), -(__v8df) (C), \
923 (__mmask8) (U), (R)); })
/* fnmadd on 8 x double with rounding argument R. Each macro calls the
   vfmaddpd512 builtin with A negated; B and C are passed through unchanged. */
/* Unmasked form: _mask builtin, all-ones __mmask8, A negated. */
926 #define _mm512_fnmadd_round_pd(A, B, C, R) __extension__ ({ \
927 (__m512d) __builtin_ia32_vfmaddpd512_mask (-(__v8df) (A), \
928 (__v8df) (B), (__v8df) (C), \
929 (__mmask8) -1, (R)); })
/* mask3 form: _mask3 builtin, mask U after the operands, A negated. */
932 #define _mm512_mask3_fnmadd_round_pd(A, B, C, U, R) __extension__ ({ \
933 (__m512d) __builtin_ia32_vfmaddpd512_mask3 (-(__v8df) (A), \
934 (__v8df) (B), (__v8df) (C), \
935 (__mmask8) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, A negated. */
938 #define _mm512_maskz_fnmadd_round_pd(U, A, B, C, R) __extension__ ({ \
939 (__m512d) __builtin_ia32_vfmaddpd512_maskz (-(__v8df) (A), \
940 (__v8df) (B), (__v8df) (C), \
941 (__mmask8) (U), (R)); })
/* fnmsub on 8 x double with rounding argument R. Each macro calls the
   vfmaddpd512 builtin with both A and C negated. */
/* Unmasked form: _mask builtin, all-ones __mmask8. */
944 #define _mm512_fnmsub_round_pd(A, B, C, R) __extension__ ({ \
945 (__m512d) __builtin_ia32_vfmaddpd512_mask (-(__v8df) (A), \
946 (__v8df) (B), -(__v8df) (C), \
947 (__mmask8) -1, (R)); })
/* maskz form: _maskz builtin, mask U first. */
950 #define _mm512_maskz_fnmsub_round_pd(U, A, B, C, R) __extension__ ({ \
951 (__m512d) __builtin_ia32_vfmaddpd512_maskz (-(__v8df) (A), \
952 (__v8df) (B), -(__v8df) (C), \
953 (__mmask8) (U), (R)); })
959 return (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) __A,
969 return (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) __A,
979 return (__m512d) __builtin_ia32_vfmaddpd512_mask3 ((__v8df) __A,
989 return (__m512d) __builtin_ia32_vfmaddpd512_maskz ((__v8df) __A,
999 return (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) __A,
1009 return (__m512d) __builtin_ia32_vfmaddpd512_mask ((__v8df) __A,
1019 return (__m512d) __builtin_ia32_vfmaddpd512_maskz ((__v8df) __A,
1029 return (__m512d) __builtin_ia32_vfmaddpd512_mask (-(__v8df) __A,
1039 return (__m512d) __builtin_ia32_vfmaddpd512_mask3 (-(__v8df) __A,
1049 return (__m512d) __builtin_ia32_vfmaddpd512_maskz (-(__v8df) __A,
1059 return (__m512d) __builtin_ia32_vfmaddpd512_mask (-(__v8df) __A,
1069 return (__m512d) __builtin_ia32_vfmaddpd512_maskz (-(__v8df) __A,
/* fmadd on 16 x float with an explicit rounding argument R. A, B and C reach
   the builtin unmodified; the four variants differ only in the builtin suffix
   and in where the __mmask16 comes from. Mind the differing argument orders:
   (A, B, C, R), (A, U, B, C, R), (A, B, C, U, R) and (U, A, B, C, R).
   NOTE(review): how each builtin suffix treats masked-off lanes is not
   visible in this file - confirm against the Intel Intrinsics Guide. */
/* Unmasked form: _mask builtin with an all-ones __mmask16. */
1076 #define _mm512_fmadd_round_ps(A, B, C, R) __extension__ ({ \
1077 (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) (A), \
1078 (__v16sf) (B), (__v16sf) (C), \
1079 (__mmask16) -1, (R)); })
/* Masked form: same _mask builtin, caller-supplied mask U. */
1082 #define _mm512_mask_fmadd_round_ps(A, U, B, C, R) __extension__ ({ \
1083 (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) (A), \
1084 (__v16sf) (B), (__v16sf) (C), \
1085 (__mmask16) (U), (R)); })
/* mask3 form: _mask3 builtin, mask U given after the three operands. */
1088 #define _mm512_mask3_fmadd_round_ps(A, B, C, U, R) __extension__ ({ \
1089 (__m512) __builtin_ia32_vfmaddps512_mask3 ((__v16sf) (A), \
1090 (__v16sf) (B), (__v16sf) (C), \
1091 (__mmask16) (U), (R)); })
/* maskz form: _maskz builtin, mask U given before the three operands. */
1094 #define _mm512_maskz_fmadd_round_ps(U, A, B, C, R) __extension__ ({ \
1095 (__m512) __builtin_ia32_vfmaddps512_maskz ((__v16sf) (A), \
1096 (__v16sf) (B), (__v16sf) (C), \
1097 (__mmask16) (U), (R)); })
/* fmsub on 16 x float with rounding argument R. Each macro calls the
   vfmaddps512 builtin with C negated. */
/* Unmasked form: _mask builtin, all-ones __mmask16, C negated. */
1100 #define _mm512_fmsub_round_ps(A, B, C, R) __extension__ ({ \
1101 (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) (A), \
1102 (__v16sf) (B), -(__v16sf) (C), \
1103 (__mmask16) -1, (R)); })
/* Masked form: _mask builtin, caller-supplied mask U, C negated. */
1106 #define _mm512_mask_fmsub_round_ps(A, U, B, C, R) __extension__ ({ \
1107 (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) (A), \
1108 (__v16sf) (B), -(__v16sf) (C), \
1109 (__mmask16) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, C negated. */
1112 #define _mm512_maskz_fmsub_round_ps(U, A, B, C, R) __extension__ ({ \
1113 (__m512) __builtin_ia32_vfmaddps512_maskz ((__v16sf) (A), \
1114 (__v16sf) (B), -(__v16sf) (C), \
1115 (__mmask16) (U), (R)); })
/* fnmadd on 16 x float with rounding argument R. Each macro calls the
   vfmaddps512 builtin with A negated; B and C are passed through unchanged. */
/* Unmasked form: _mask builtin, all-ones __mmask16, A negated. */
1118 #define _mm512_fnmadd_round_ps(A, B, C, R) __extension__ ({ \
1119 (__m512) __builtin_ia32_vfmaddps512_mask (-(__v16sf) (A), \
1120 (__v16sf) (B), (__v16sf) (C), \
1121 (__mmask16) -1, (R)); })
/* mask3 form: _mask3 builtin, mask U after the operands, A negated. */
1124 #define _mm512_mask3_fnmadd_round_ps(A, B, C, U, R) __extension__ ({ \
1125 (__m512) __builtin_ia32_vfmaddps512_mask3 (-(__v16sf) (A), \
1126 (__v16sf) (B), (__v16sf) (C), \
1127 (__mmask16) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, A negated. */
1130 #define _mm512_maskz_fnmadd_round_ps(U, A, B, C, R) __extension__ ({ \
1131 (__m512) __builtin_ia32_vfmaddps512_maskz (-(__v16sf) (A), \
1132 (__v16sf) (B), (__v16sf) (C), \
1133 (__mmask16) (U), (R)); })
/* fnmsub on 16 x float with rounding argument R. Each macro calls the
   vfmaddps512 builtin with both A and C negated. */
/* Unmasked form: _mask builtin, all-ones __mmask16. */
1136 #define _mm512_fnmsub_round_ps(A, B, C, R) __extension__ ({ \
1137 (__m512) __builtin_ia32_vfmaddps512_mask (-(__v16sf) (A), \
1138 (__v16sf) (B), -(__v16sf) (C), \
1139 (__mmask16) -1, (R)); })
/* maskz form: _maskz builtin, mask U first. */
1142 #define _mm512_maskz_fnmsub_round_ps(U, A, B, C, R) __extension__ ({ \
1143 (__m512) __builtin_ia32_vfmaddps512_maskz (-(__v16sf) (A), \
1144 (__v16sf) (B), -(__v16sf) (C), \
1145 (__mmask16) (U), (R)); })
1151 return (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) __A,
1161 return (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) __A,
1171 return (__m512) __builtin_ia32_vfmaddps512_mask3 ((__v16sf) __A,
1181 return (__m512) __builtin_ia32_vfmaddps512_maskz ((__v16sf) __A,
1191 return (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) __A,
1201 return (__m512) __builtin_ia32_vfmaddps512_mask ((__v16sf) __A,
1211 return (__m512) __builtin_ia32_vfmaddps512_maskz ((__v16sf) __A,
1221 return (__m512) __builtin_ia32_vfmaddps512_mask (-(__v16sf) __A,
1231 return (__m512) __builtin_ia32_vfmaddps512_mask3 (-(__v16sf) __A,
1241 return (__m512) __builtin_ia32_vfmaddps512_maskz (-(__v16sf) __A,
1251 return (__m512) __builtin_ia32_vfmaddps512_mask (-(__v16sf) __A,
1261 return (__m512) __builtin_ia32_vfmaddps512_maskz (-(__v16sf) __A,
/* fmaddsub on 8 x double with an explicit rounding argument R. A, B and C
   reach the vfmaddsubpd512 builtin unmodified; the variants differ only in
   builtin suffix, mask source and argument order.
   NOTE(review): which lanes add and which subtract is decided inside the
   builtin and is not visible here - confirm against the Intel Intrinsics
   Guide. */
/* Unmasked form: _mask builtin with an all-ones __mmask8. */
1268 #define _mm512_fmaddsub_round_pd(A, B, C, R) __extension__ ({ \
1269 (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) (A), \
1270 (__v8df) (B), (__v8df) (C), \
1271 (__mmask8) -1, (R)); })
/* Masked form: same _mask builtin, caller-supplied mask U. */
1274 #define _mm512_mask_fmaddsub_round_pd(A, U, B, C, R) __extension__ ({ \
1275 (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) (A), \
1276 (__v8df) (B), (__v8df) (C), \
1277 (__mmask8) (U), (R)); })
/* mask3 form: _mask3 builtin, mask U given after the three operands. */
1280 #define _mm512_mask3_fmaddsub_round_pd(A, B, C, U, R) __extension__ ({ \
1281 (__m512d) __builtin_ia32_vfmaddsubpd512_mask3 ((__v8df) (A), \
1282 (__v8df) (B), (__v8df) (C), \
1283 (__mmask8) (U), (R)); })
/* maskz form: _maskz builtin, mask U given before the three operands. */
1286 #define _mm512_maskz_fmaddsub_round_pd(U, A, B, C, R) __extension__ ({ \
1287 (__m512d) __builtin_ia32_vfmaddsubpd512_maskz ((__v8df) (A), \
1288 (__v8df) (B), (__v8df) (C), \
1289 (__mmask8) (U), (R)); })
/* fmsubadd on 8 x double with rounding argument R. Each macro calls the
   vfmaddsubpd512 builtin with C negated rather than a separate fmsubadd
   builtin. */
/* Unmasked form: _mask builtin, all-ones __mmask8, C negated. */
1292 #define _mm512_fmsubadd_round_pd(A, B, C, R) __extension__ ({ \
1293 (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) (A), \
1294 (__v8df) (B), -(__v8df) (C), \
1295 (__mmask8) -1, (R)); })
/* Masked form: _mask builtin, caller-supplied mask U, C negated. */
1298 #define _mm512_mask_fmsubadd_round_pd(A, U, B, C, R) __extension__ ({ \
1299 (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) (A), \
1300 (__v8df) (B), -(__v8df) (C), \
1301 (__mmask8) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, C negated. */
1304 #define _mm512_maskz_fmsubadd_round_pd(U, A, B, C, R) __extension__ ({ \
1305 (__m512d) __builtin_ia32_vfmaddsubpd512_maskz ((__v8df) (A), \
1306 (__v8df) (B), -(__v8df) (C), \
1307 (__mmask8) (U), (R)); })
1313 return (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) __A,
1323 return (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) __A,
1333 return (__m512d) __builtin_ia32_vfmaddsubpd512_mask3 ((__v8df) __A,
1343 return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz ((__v8df) __A,
1353 return (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) __A,
1363 return (__m512d) __builtin_ia32_vfmaddsubpd512_mask ((__v8df) __A,
1373 return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz ((__v8df) __A,
/* fmaddsub on 16 x float with an explicit rounding argument R. A, B and C
   reach the vfmaddsubps512 builtin unmodified; the variants differ only in
   builtin suffix, mask source and argument order.
   NOTE(review): which lanes add and which subtract is decided inside the
   builtin and is not visible here - confirm against the Intel Intrinsics
   Guide. */
/* Unmasked form: _mask builtin with an all-ones __mmask16. */
1380 #define _mm512_fmaddsub_round_ps(A, B, C, R) __extension__ ({ \
1381 (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) (A), \
1382 (__v16sf) (B), (__v16sf) (C), \
1383 (__mmask16) -1, (R)); })
/* Masked form: same _mask builtin, caller-supplied mask U. */
1386 #define _mm512_mask_fmaddsub_round_ps(A, U, B, C, R) __extension__ ({ \
1387 (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) (A), \
1388 (__v16sf) (B), (__v16sf) (C), \
1389 (__mmask16) (U), (R)); })
/* mask3 form: _mask3 builtin, mask U given after the three operands. */
1392 #define _mm512_mask3_fmaddsub_round_ps(A, B, C, U, R) __extension__ ({ \
1393 (__m512) __builtin_ia32_vfmaddsubps512_mask3 ((__v16sf) (A), \
1394 (__v16sf) (B), (__v16sf) (C), \
1395 (__mmask16) (U), (R)); })
/* maskz form: _maskz builtin, mask U given before the three operands. */
1398 #define _mm512_maskz_fmaddsub_round_ps(U, A, B, C, R) __extension__ ({ \
1399 (__m512) __builtin_ia32_vfmaddsubps512_maskz ((__v16sf) (A), \
1400 (__v16sf) (B), (__v16sf) (C), \
1401 (__mmask16) (U), (R)); })
/* fmsubadd on 16 x float with rounding argument R. Each macro calls the
   vfmaddsubps512 builtin with C negated rather than a separate fmsubadd
   builtin. */
/* Unmasked form: _mask builtin, all-ones __mmask16, C negated. */
1404 #define _mm512_fmsubadd_round_ps(A, B, C, R) __extension__ ({ \
1405 (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) (A), \
1406 (__v16sf) (B), -(__v16sf) (C), \
1407 (__mmask16) -1, (R)); })
/* Masked form: _mask builtin, caller-supplied mask U, C negated. */
1410 #define _mm512_mask_fmsubadd_round_ps(A, U, B, C, R) __extension__ ({ \
1411 (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) (A), \
1412 (__v16sf) (B), -(__v16sf) (C), \
1413 (__mmask16) (U), (R)); })
/* maskz form: _maskz builtin, mask U first, C negated. */
1416 #define _mm512_maskz_fmsubadd_round_ps(U, A, B, C, R) __extension__ ({ \
1417 (__m512) __builtin_ia32_vfmaddsubps512_maskz ((__v16sf) (A), \
1418 (__v16sf) (B), -(__v16sf) (C), \
1419 (__mmask16) (U), (R)); })
1425 return (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) __A,
1435 return (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) __A,
1445 return (__m512) __builtin_ia32_vfmaddsubps512_mask3 ((__v16sf) __A,
1455 return (__m512) __builtin_ia32_vfmaddsubps512_maskz ((__v16sf) __A,
1465 return (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) __A,
1475 return (__m512) __builtin_ia32_vfmaddsubps512_mask ((__v16sf) __A,
1485 return (__m512) __builtin_ia32_vfmaddsubps512_maskz ((__v16sf) __A,
/* mask3 fmsub on 8 x double, argument order (A, B, C, U, R). Unlike the other
   fmsub_round_pd macros in this header, which negate C around a vfmadd
   builtin, this one calls the dedicated __builtin_ia32_vfmsubpd512_mask3 and
   passes C unnegated.
   NOTE(review): presumably because the _mask3 form hands C back for
   masked-off lanes, so C must stay unmodified - confirm. */
1492 #define _mm512_mask3_fmsub_round_pd(A, B, C, U, R) __extension__ ({ \
1493 (__m512d) __builtin_ia32_vfmsubpd512_mask3 ((__v8df) (A), \
1494 (__v8df) (B), (__v8df) (C), \
1495 (__mmask8) (U), (R)); })
1501 return (__m512d) __builtin_ia32_vfmsubpd512_mask3 ((__v8df) __A,
/* mask3 fmsub on 16 x float, argument order (A, B, C, U, R). Unlike the other
   fmsub_round_ps macros in this header, which negate C around a vfmadd
   builtin, this one calls the dedicated __builtin_ia32_vfmsubps512_mask3 and
   passes C unnegated.
   NOTE(review): presumably because the _mask3 form hands C back for
   masked-off lanes, so C must stay unmodified - confirm. */
1508 #define _mm512_mask3_fmsub_round_ps(A, B, C, U, R) __extension__ ({ \
1509 (__m512) __builtin_ia32_vfmsubps512_mask3 ((__v16sf) (A), \
1510 (__v16sf) (B), (__v16sf) (C), \
1511 (__mmask16) (U), (R)); })
1517 return (__m512) __builtin_ia32_vfmsubps512_mask3 ((__v16sf) __A,
/* mask3 fmsubadd on 8 x double, argument order (A, B, C, U, R). Calls the
   dedicated __builtin_ia32_vfmsubaddpd512_mask3 with C unnegated, whereas the
   other fmsubadd_round_pd macros in this header negate C around vfmaddsub.
   NOTE(review): presumably so the pass-through operand C is not altered -
   confirm. */
1524 #define _mm512_mask3_fmsubadd_round_pd(A, B, C, U, R) __extension__ ({ \
1525 (__m512d) __builtin_ia32_vfmsubaddpd512_mask3 ((__v8df) (A), \
1526 (__v8df) (B), (__v8df) (C), \
1527 (__mmask8) (U), (R)); })
1533 return (__m512d) __builtin_ia32_vfmsubaddpd512_mask3 ((__v8df) __A,
/* mask3 fmsubadd on 16 x float, argument order (A, B, C, U, R). Calls the
   dedicated __builtin_ia32_vfmsubaddps512_mask3 with C unnegated, whereas the
   other fmsubadd_round_ps macros in this header negate C around vfmaddsub.
   NOTE(review): presumably so the pass-through operand C is not altered -
   confirm. */
1540 #define _mm512_mask3_fmsubadd_round_ps(A, B, C, U, R) __extension__ ({ \
1541 (__m512) __builtin_ia32_vfmsubaddps512_mask3 ((__v16sf) (A), \
1542 (__v16sf) (B), (__v16sf) (C), \
1543 (__mmask16) (U), (R)); })
1549 return (__m512) __builtin_ia32_vfmsubaddps512_mask3 ((__v16sf) __A,
/* Masked fnmadd on 8 x double, argument order (A, U, B, C, R). Calls the
   dedicated __builtin_ia32_vfnmaddpd512_mask with A unnegated, whereas the
   other fnmadd_round_pd macros in this header negate A around vfmadd.
   NOTE(review): presumably because the _mask form hands A back for
   masked-off lanes, so A must stay unmodified - confirm. */
1556 #define _mm512_mask_fnmadd_round_pd(A, U, B, C, R) __extension__ ({ \
1557 (__m512d) __builtin_ia32_vfnmaddpd512_mask ((__v8df) (A), \
1558 (__v8df) (B), (__v8df) (C), \
1559 (__mmask8) (U), (R)); })
1565 return (__m512d) __builtin_ia32_vfnmaddpd512_mask ((__v8df) __A,
/* Masked fnmadd on 16 x float, argument order (A, U, B, C, R). Calls the
   dedicated __builtin_ia32_vfnmaddps512_mask with A unnegated, whereas the
   other fnmadd_round_ps macros in this header negate A around vfmadd.
   NOTE(review): presumably because the _mask form hands A back for
   masked-off lanes, so A must stay unmodified - confirm. */
1572 #define _mm512_mask_fnmadd_round_ps(A, U, B, C, R) __extension__ ({ \
1573 (__m512) __builtin_ia32_vfnmaddps512_mask ((__v16sf) (A), \
1574 (__v16sf) (B), (__v16sf) (C), \
1575 (__mmask16) (U), (R)); })
1581 return (__m512) __builtin_ia32_vfnmaddps512_mask ((__v16sf) __A,
/* Masked fnmsub on 8 x double. Both macros call dedicated vfnmsubpd512
   builtins and pass A, B and C unnegated, whereas the unmasked and maskz
   fnmsub_round_pd macros in this header negate A and C around vfmadd. */
/* _mask form, argument order (A, U, B, C, R). */
1588 #define _mm512_mask_fnmsub_round_pd(A, U, B, C, R) __extension__ ({ \
1589 (__m512d) __builtin_ia32_vfnmsubpd512_mask ((__v8df) (A), \
1590 (__v8df) (B), (__v8df) (C), \
1591 (__mmask8) (U), (R)); })
/* _mask3 form, argument order (A, B, C, U, R). */
1594 #define _mm512_mask3_fnmsub_round_pd(A, B, C, U, R) __extension__ ({ \
1595 (__m512d) __builtin_ia32_vfnmsubpd512_mask3 ((__v8df) (A), \
1596 (__v8df) (B), (__v8df) (C), \
1597 (__mmask8) (U), (R)); })
1603 return (__m512d) __builtin_ia32_vfnmsubpd512_mask ((__v8df) __A,
1613 return (__m512d) __builtin_ia32_vfnmsubpd512_mask3 ((__v8df) __A,
/* Masked fnmsub on 16 x float. Both macros call dedicated vfnmsubps512
   builtins and pass A, B and C unnegated, whereas the unmasked and maskz
   fnmsub_round_ps macros in this header negate A and C around vfmadd. */
/* _mask form, argument order (A, U, B, C, R). */
1620 #define _mm512_mask_fnmsub_round_ps(A, U, B, C, R) __extension__ ({ \
1621 (__m512) __builtin_ia32_vfnmsubps512_mask ((__v16sf) (A), \
1622 (__v16sf) (B), (__v16sf) (C), \
1623 (__mmask16) (U), (R)); })
/* _mask3 form, argument order (A, B, C, U, R). */
1626 #define _mm512_mask3_fnmsub_round_ps(A, B, C, U, R) __extension__ ({ \
1627 (__m512) __builtin_ia32_vfnmsubps512_mask3 ((__v16sf) (A), \
1628 (__v16sf) (B), (__v16sf) (C), \
1629 (__mmask16) (U), (R)); })
1635 return (__m512) __builtin_ia32_vfnmsubps512_mask ((__v16sf) __A,
1645 return (__m512) __builtin_ia32_vfnmsubps512_mask3 ((__v16sf) __A,
1659 return (__m512i) __builtin_ia32_vpermt2vard512_mask ((__v16si) __I
1668 return (__m512i) __builtin_ia32_vpermt2varq512_mask ((__v8di) __I
1678 return (__m512d) __builtin_ia32_vpermt2varpd512_mask ((__v8di) __I
1687 return (__m512) __builtin_ia32_vpermt2varps512_mask ((__v16si) __I
1694 #define _mm512_alignr_epi64(A, B, I) __extension__ ({ \
1695 (__m512i)__builtin_ia32_alignq512_mask((__v8di)(__m512i)(A), \
1696 (__v8di)(__m512i)(B), \
1697 (I), (__v8di)_mm512_setzero_si512(), \
1700 #define _mm512_alignr_epi32(A, B, I) __extension__ ({ \
1701 (__m512i)__builtin_ia32_alignd512_mask((__v16si)(__m512i)(A), \
1702 (__v16si)(__m512i)(B), \
1703 (I), (__v16si)_mm512_setzero_si512(), \
1708 #define _mm512_extractf64x4_pd(A, I) __extension__ ({ \
1709 __m512d __A = (A); \
1711 __builtin_ia32_extractf64x4_mask((__v8df)__A, \
1713 (__v4df)_mm256_setzero_si256(), \
1716 #define _mm512_extractf32x4_ps(A, I) __extension__ ({ \
1719 __builtin_ia32_extractf32x4_mask((__v16sf)__A, \
1721 (__v4sf)_mm_setzero_ps(), \
1729 return (__m512d) __builtin_ia32_blendmpd_512_mask ((__v8df) __A,
1737 return (__m512) __builtin_ia32_blendmps_512_mask ((__v16sf) __A,
1745 return (__m512i) __builtin_ia32_blendmq_512_mask ((__v8di) __A,
1753 return (__m512i) __builtin_ia32_blendmd_512_mask ((__v16si) __A,
/* Comparison of two 16 x float vectors, yielding a __mmask16.
     A, B - operands; each is cast to __m512 and then to __v16sf.
     P    - comparison predicate, forwarded unchanged to the builtin.
     R    - trailing control argument forwarded unchanged to the builtin.
     U    - incoming mask for the _mask_ forms.
   NOTE(review): the set of valid P values is not defined in the visible part
   of this file - confirm against the Intel Intrinsics Guide. */
/* Unmasked, explicit R: all-ones __mmask16 is passed as the incoming mask. */
1760 #define _mm512_cmp_round_ps_mask(A, B, P, R) __extension__ ({ \
1761 (__mmask16)__builtin_ia32_cmpps512_mask((__v16sf)(__m512)(A), \
1762 (__v16sf)(__m512)(B), \
1763 (P), (__mmask16)-1, (R)); })
/* Masked, explicit R: U is passed as the incoming mask. */
1765 #define _mm512_mask_cmp_round_ps_mask(U, A, B, P, R) __extension__ ({ \
1766 (__mmask16)__builtin_ia32_cmpps512_mask((__v16sf)(__m512)(A), \
1767 (__v16sf)(__m512)(B), \
1768 (P), (__mmask16)(U), (R)); })
/* Unmasked convenience form: supplies _MM_FROUND_CUR_DIRECTION for R. */
1770 #define _mm512_cmp_ps_mask(A, B, P) \
1771 _mm512_cmp_round_ps_mask((A), (B), (P), _MM_FROUND_CUR_DIRECTION)
/* Masked convenience form: supplies _MM_FROUND_CUR_DIRECTION for R. */
1773 #define _mm512_mask_cmp_ps_mask(U, A, B, P) \
1774 _mm512_mask_cmp_round_ps_mask((U), (A), (B), (P), _MM_FROUND_CUR_DIRECTION)
/* Comparison of two 8 x double vectors, yielding a __mmask8.
     A, B - operands; each is cast to __m512d and then to __v8df.
     P    - comparison predicate, forwarded unchanged to the builtin.
     R    - trailing control argument forwarded unchanged to the builtin.
     U    - incoming mask for the _mask_ forms.
   NOTE(review): the set of valid P values is not defined in the visible part
   of this file - confirm against the Intel Intrinsics Guide. */
/* Unmasked, explicit R: all-ones __mmask8 is passed as the incoming mask. */
1776 #define _mm512_cmp_round_pd_mask(A, B, P, R) __extension__ ({ \
1777 (__mmask8)__builtin_ia32_cmppd512_mask((__v8df)(__m512d)(A), \
1778 (__v8df)(__m512d)(B), \
1779 (P), (__mmask8)-1, (R)); })
/* Masked, explicit R: U is passed as the incoming mask. */
1781 #define _mm512_mask_cmp_round_pd_mask(U, A, B, P, R) __extension__ ({ \
1782 (__mmask8)__builtin_ia32_cmppd512_mask((__v8df)(__m512d)(A), \
1783 (__v8df)(__m512d)(B), \
1784 (P), (__mmask8)(U), (R)); })
/* Unmasked convenience form: supplies _MM_FROUND_CUR_DIRECTION for R. */
1786 #define _mm512_cmp_pd_mask(A, B, P) \
1787 _mm512_cmp_round_pd_mask((A), (B), (P), _MM_FROUND_CUR_DIRECTION)
/* Masked convenience form: supplies _MM_FROUND_CUR_DIRECTION for R. */
1789 #define _mm512_mask_cmp_pd_mask(U, A, B, P) \
1790 _mm512_mask_cmp_round_pd_mask((U), (A), (B), (P), _MM_FROUND_CUR_DIRECTION)
1797 return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
/* Convert a 16 x 32-bit integer vector A to __m512 with rounding argument R.
   Both macros pass a zeroed float vector as the second builtin argument and
   an all-ones __mmask16.
   NOTE(review): the epi32/epu32 names suggest signed vs unsigned source
   lanes (cvtdq2ps vs cvtudq2ps builtin) - confirm. */
1804 #define _mm512_cvt_roundepi32_ps(A, R) __extension__ ({ \
1805 (__m512)__builtin_ia32_cvtdq2ps512_mask((__v16si)(A), \
1806 (__v16sf)_mm512_setzero_ps(), \
1807 (__mmask16)-1, (R)); })
/* Same shape as above but calls the cvtudq2ps512 builtin. */
1809 #define _mm512_cvt_roundepu32_ps(A, R) __extension__ ({ \
1810 (__m512)__builtin_ia32_cvtudq2ps512_mask((__v16si)(A), \
1811 (__v16sf)_mm512_setzero_ps(), \
1812 (__mmask16)-1, (R)); })
1817 return (__m512d) __builtin_ia32_cvtdq2pd512_mask ((__v8si) __A,
1826 return (__m512d) __builtin_ia32_cvtudq2pd512_mask ((__v8si) __A,
/* Convert the 8 x double vector A to a 256-bit float result (__m256) with
   rounding argument R. A zeroed __m256 is passed as the second builtin
   argument and the mask is an all-ones __mmask8. */
1832 #define _mm512_cvt_roundpd_ps(A, R) __extension__ ({ \
1833 (__m256)__builtin_ia32_cvtpd2ps512_mask((__v8df)(A), \
1834 (__v8sf)_mm256_setzero_ps(), \
1835 (__mmask8)-1, (R)); })
1837 #define _mm512_cvtps_ph(A, I) __extension__ ({ \
1838 (__m256i)__builtin_ia32_vcvtps2ph512_mask((__v16sf)(A), (I), \
1839 (__v16hi)_mm256_setzero_si256(), \
1845 return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
1856 __builtin_ia32_cvttps2dq512_mask((__v16sf) a,
1864 return (__m256i)__builtin_ia32_cvttpd2dq512_mask((__v8df) a,
/* "cvtt" float-to-int32 conversions with control argument R. Each passes a
   zeroed integer vector as the second builtin argument and an all-ones mask.
   NOTE(review): the "tt" in the builtin names suggests truncating
   conversion - confirm against the Intel Intrinsics Guide. */
/* 8 x double in, __m256i out. */
1870 #define _mm512_cvtt_roundpd_epi32(A, R) __extension__ ({ \
1871 (__m256i)__builtin_ia32_cvttpd2dq512_mask((__v8df)(A), \
1872 (__v8si)_mm256_setzero_si256(), \
1873 (__mmask8)-1, (R)); })
/* 16 x float in, __m512i out. */
1875 #define _mm512_cvtt_roundps_epi32(A, R) __extension__ ({ \
1876 (__m512i)__builtin_ia32_cvttps2dq512_mask((__v16sf)(A), \
1877 (__v16si)_mm512_setzero_si512(), \
1878 (__mmask16)-1, (R)); })
/* Float-to-int32 conversions with rounding argument R (cvtps2dq / cvtpd2dq
   builtins). Each passes a zeroed integer vector as the second builtin
   argument and an all-ones mask. */
/* 16 x float in, __m512i out. */
1880 #define _mm512_cvt_roundps_epi32(A, R) __extension__ ({ \
1881 (__m512i)__builtin_ia32_cvtps2dq512_mask((__v16sf)(A), \
1882 (__v16si)_mm512_setzero_si512(), \
1883 (__mmask16)-1, (R)); })
/* 8 x double in, __m256i out. */
1885 #define _mm512_cvt_roundpd_epi32(A, R) __extension__ ({ \
1886 (__m256i)__builtin_ia32_cvtpd2dq512_mask((__v8df)(A), \
1887 (__v8si)_mm256_setzero_si256(), \
1888 (__mmask8)-1, (R)); })
/* Float-to-int32 conversions with rounding argument R that call the
   cvtps2udq / cvtpd2udq builtins. Each passes a zeroed integer vector as the
   second builtin argument and an all-ones mask.
   NOTE(review): the epu32 / "udq" naming suggests unsigned 32-bit results -
   confirm against the Intel Intrinsics Guide. */
/* 16 x float in, __m512i out. */
1890 #define _mm512_cvt_roundps_epu32(A, R) __extension__ ({ \
1891 (__m512i)__builtin_ia32_cvtps2udq512_mask((__v16sf)(A), \
1892 (__v16si)_mm512_setzero_si512(), \
1893 (__mmask16)-1, (R)); })
/* 8 x double in, __m256i out. */
1895 #define _mm512_cvt_roundpd_epu32(A, R) __extension__ ({ \
1896 (__m256i)__builtin_ia32_cvtpd2udq512_mask((__v8df)(A), \
1897 (__v8si)_mm256_setzero_si256(), \
1898 (__mmask8) -1, (R)); })
1904 return __builtin_shufflevector(__a, __b, 1, 9, 1+2, 9+2, 1+4, 9+4, 1+6, 9+6);
1910 return __builtin_shufflevector(__a, __b, 0, 8, 0+2, 8+2, 0+4, 8+4, 0+6, 8+6);
1916 return __builtin_shufflevector(__a, __b,
1918 2+4, 18+4, 3+4, 19+4,
1919 2+8, 18+8, 3+8, 19+8,
1920 2+12, 18+12, 3+12, 19+12);
1926 return __builtin_shufflevector(__a, __b,
1928 0+4, 16+4, 1+4, 17+4,
1929 0+8, 16+8, 1+8, 17+8,
1930 0+12, 16+12, 1+12, 17+12);
1938 return (__mmask16) __builtin_ia32_ptestmd512 ((__v16si) __A,
1946 return (__mmask8) __builtin_ia32_ptestmq512 ((__v8di) __A,
1956 return (__m512i) __builtin_ia32_loaddqusi512_mask ((
const __v16si *)__P,
1965 return (__m512i) __builtin_ia32_loaddqudi512_mask ((
const __v8di *)__P,
1974 return (__m512) __builtin_ia32_loadups512_mask ((
const __v16sf *)__P,
1983 return (__m512d) __builtin_ia32_loadupd512_mask ((
const __v8df *)__P,
1992 return (__m512) __builtin_ia32_loadaps512_mask ((
const __v16sf *)__P,
2001 return (__m512d) __builtin_ia32_loadapd512_mask ((
const __v8df *)__P,
2013 return ((
struct __loadu_pd*)__p)->__v;
2022 return ((
struct __loadu_ps*)__p)->__v;
2028 return (__m512) __builtin_ia32_loadaps512_mask ((
const __v16sf *)__p,
2037 return (__m512d) __builtin_ia32_loadapd512_mask ((
const __v8df *)__p,
2048 __builtin_ia32_storedqudi512_mask ((__v8di *)__P, (__v8di) __A,
2055 __builtin_ia32_storedqusi512_mask ((__v16si *)__P, (__v16si) __A,
2062 __builtin_ia32_storeupd512_mask ((__v8df *)__P, (__v8df) __A, (__mmask8) __U);
2068 __builtin_ia32_storeupd512_mask((__v8df *)__P, (__v8df)__A, (__mmask8)-1);
2074 __builtin_ia32_storeups512_mask ((__v16sf *)__P, (__v16sf) __A,
2081 __builtin_ia32_storeups512_mask((__v16sf *)__P, (__v16sf)__A, (__mmask16)-1);
2087 __builtin_ia32_storeapd512_mask ((__v8df *)__P, (__v8df) __A, (__mmask8) __U);
2093 *(__m512d*)__P = __A;
2099 __builtin_ia32_storeaps512_mask ((__v16sf *)__P, (__v16sf) __A,
2106 *(__m512*)__P = __A;
2114 return __builtin_ia32_knothi(__M);
2121 return (__mmask16)__builtin_ia32_pcmpeqd512_mask((__v16si)__a, (__v16si)__b,
2127 return (__mmask16)__builtin_ia32_pcmpeqd512_mask((__v16si)__a, (__v16si)__b,
2133 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 0,
2139 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 0,
2145 return (__mmask8)__builtin_ia32_pcmpeqq512_mask((__v8di)__a, (__v8di)__b,
2151 return (__mmask8)__builtin_ia32_pcmpeqq512_mask((__v8di)__a, (__v8di)__b,
2157 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 0,
2163 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 0,
2169 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 5,
2175 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 5,
2181 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 5,
2187 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 5,
2193 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 5,
2199 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 5,
2205 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 5,
2211 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 5,
2217 return (__mmask16)__builtin_ia32_pcmpgtd512_mask((__v16si)__a, (__v16si)__b,
2223 return (__mmask16)__builtin_ia32_pcmpgtd512_mask((__v16si)__a, (__v16si)__b,
2229 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 6,
2235 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 6,
2241 return (__mmask8)__builtin_ia32_pcmpgtq512_mask((__v8di)__a, (__v8di)__b,
2247 return (__mmask8)__builtin_ia32_pcmpgtq512_mask((__v8di)__a, (__v8di)__b,
2253 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 6,
2259 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 6,
2265 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 2,
2271 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 2,
2277 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 2,
2283 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 2,
2289 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 2,
2295 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 2,
2301 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 2,
2307 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 2,
2313 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 1,
2319 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 1,
2325 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 1,
2331 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 1,
2337 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 1,
2343 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 1,
2349 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 1,
2355 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 1,
2361 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 4,
2367 return (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, 4,
2373 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 4,
2379 return (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, 4,
2385 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 4,
2391 return (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, 4,
2397 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 4,
2403 return (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, 4,
2407 #define _mm512_cmp_epi32_mask(a, b, p) __extension__ ({ \
2408 __m512i __a = (a); \
2409 __m512i __b = (b); \
2410 (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, (p), \
2413 #define _mm512_cmp_epu32_mask(a, b, p) __extension__ ({ \
2414 __m512i __a = (a); \
2415 __m512i __b = (b); \
2416 (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, (p), \
2419 #define _mm512_cmp_epi64_mask(a, b, p) __extension__ ({ \
2420 __m512i __a = (a); \
2421 __m512i __b = (b); \
2422 (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, (p), \
2425 #define _mm512_cmp_epu64_mask(a, b, p) __extension__ ({ \
2426 __m512i __a = (a); \
2427 __m512i __b = (b); \
2428 (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, (p), \
2431 #define _mm512_mask_cmp_epi32_mask(m, a, b, p) __extension__ ({ \
2432 __m512i __a = (a); \
2433 __m512i __b = (b); \
2434 (__mmask16)__builtin_ia32_cmpd512_mask((__v16si)__a, (__v16si)__b, (p), \
2437 #define _mm512_mask_cmp_epu32_mask(m, a, b, p) __extension__ ({ \
2438 __m512i __a = (a); \
2439 __m512i __b = (b); \
2440 (__mmask16)__builtin_ia32_ucmpd512_mask((__v16si)__a, (__v16si)__b, (p), \
2443 #define _mm512_mask_cmp_epi64_mask(m, a, b, p) __extension__ ({ \
2444 __m512i __a = (a); \
2445 __m512i __b = (b); \
2446 (__mmask8)__builtin_ia32_cmpq512_mask((__v8di)__a, (__v8di)__b, (p), \
2449 #define _mm512_mask_cmp_epu64_mask(m, a, b, p) __extension__ ({ \
2450 __m512i __a = (a); \
2451 __m512i __b = (b); \
2452 (__mmask8)__builtin_ia32_ucmpq512_mask((__v8di)__a, (__v8di)__b, (p), \
2455 #undef __DEFAULT_FN_ATTRS
2457 #endif // __AVX512FINTRIN_H
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_cvtph_ps(__m256i __A)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpeq_epi32_mask(__m512i __a, __m512i __b)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_store_pd(void *__P, __mmask8 __U, __m512d __A)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpgt_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_mullo_epi32(__mmask16 __M, __m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fnmsub_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_xor_si512(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_add_epi32(__mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fmadd_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_unpackhi_ps(__m512 __a, __m512 __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_and_epi32(__m512i __src, __mmask16 __k, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_sub_epi32(__m512i __A, __m512i __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpeq_epi64_mask(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mask_blend_epi64(__mmask8 __U, __m512i __A, __m512i __W)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fmsub_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mul_epu32(__m512i __X, __m512i __Y)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_sub_ps(__m512 __a, __m512 __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fmaddsub_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_setzero_pd(void)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_add_epi64(__mmask8 __U, __m512i __A, __m512i __B)
static __inline void __DEFAULT_FN_ATTRS _mm512_storeu_pd(void *__P, __m512d __A)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_floor_pd(__m512d __A)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fnmsub_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fnmsub_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_min_epu64(__m512i __A, __m512i __B)
static __inline __m128 __DEFAULT_FN_ATTRS _mm512_castps512_ps128(__m512 __a)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fmsubadd_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fmsubadd_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpgt_epi32_mask(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_sub_epi64(__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_rsqrt14_ps(__m512 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_and_epi64(__mmask8 __k, __m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmple_epu64_mask(__m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fnmsub_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_xor_epi32(__m512i __src, __mmask16 __k, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_or_epi64(__mmask8 __k, __m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpeq_epu64_mask(__m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpgt_epu64_mask(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_andnot_epi32(__mmask16 __U, __m512i __A, __m512i __B)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_store_ps(void *__P, __mmask16 __U, __m512 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_xor_epi64(__mmask8 __k, __m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fmadd_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fmaddsub_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_maskz_load_ps(__mmask16 __U, void const *__P)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fmsub_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_loadu_epi64(__mmask8 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_and_epi32(__m512i __a, __m512i __b)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_setzero_ps(void)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_unpacklo_ps(__m512 __a, __m512 __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mask_blend_epi32(__mmask16 __U, __m512i __A, __m512i __W)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_set1_epi32(int __s)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_min_ps(__m512 __A, __m512 __B)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmplt_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpneq_epu32_mask(__m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpge_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_max_epi64(__m512i __A, __m512i __B)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_permutex2var_epi64(__m512i __A, __m512i __I, __m512i __B)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpgt_epu32_mask(__m512i __a, __m512i __b)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_add_ps(__m512 __a, __m512 __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fnmsub_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_set1_epi64(__mmask8 __M, long long __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_or_epi64(__m512i __a, __m512i __b)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_loadu_ps(float const *__p)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fmsub_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpge_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_rcp14_pd(__m512d __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_sub_epi32(__mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_andnot_epi64(__m512i __A, __m512i __B)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmple_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_min_epi64(__m512i __A, __m512i __B)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_cvtepu32_pd(__m256i __A)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpgt_epi64_mask(__m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpneq_epi64_mask(__m512i __a, __m512i __b)
static __inline__ __m128d __DEFAULT_FN_ATTRS _mm_rcp14_sd(__m128d __A, __m128d __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_andnot_epi32(__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_set1_pd(double __w)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fnmsub_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fnmsub_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_maskz_loadu_pd(__mmask8 __U, void const *__P)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fmadd_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_storeu_epi64(void *__P, __mmask8 __U, __m512i __A)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fmadd_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_loadu_epi32(__mmask16 __U, void const *__P)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_andnot_epi32(__m512i __A, __m512i __B)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_load_ps(double const *__p)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fmsubadd_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_loadu_pd(double const *__p)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_min_epi32(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_add_epi64(__m512i __A, __m512i __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmplt_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_max_pd(__m512d __A, __m512d __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpgt_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpeq_epu32_mask(__m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fnmadd_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline __mmask8 __DEFAULT_FN_ATTRS _mm512_test_epi64_mask(__m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_xor_epi32(__mmask16 __k, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpgt_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_or_si512(__m512i __a, __m512i __b)
static __inline __mmask16 __DEFAULT_FN_ATTRS _mm512_knot(__mmask16 __M)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_set1_epi32(__mmask16 __M, int __A)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mask_mul_epi32(__m512i __W, __mmask8 __M, __m512i __X, __m512i __Y)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpge_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fmadd_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_unpackhi_pd(__m512d __a, __m512d __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpge_epi32_mask(__m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmplt_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline void __DEFAULT_FN_ATTRS _mm512_storeu_ps(void *__P, __m512 __A)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_abs_epi64(__m512i __A)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fmaddsub_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_storeu_ps(void *__P, __mmask16 __U, __m512 __A)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fnmadd_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_set1_ps(float __w)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_sqrt_ps(__m512 a)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fmadd_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fmaddsub_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_or_epi32(__mmask16 __k, __m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmplt_epu64_mask(__m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fnmsub_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_max_epu32(__m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fmaddsub_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_min_epu32(__m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fnmadd_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmplt_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmple_epi32_mask(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_or_epi32(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mullo_epi32(__m512i __A, __m512i __B)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_min_pd(__m512d __A, __m512d __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmple_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_add_epi64(__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_and_epi64(__m512i __a, __m512i __b)
static __inline __m256i __DEFAULT_FN_ATTRS _mm512_cvttpd_epi32(__m512d a)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpeq_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mask_mul_epu32(__m512i __W, __mmask8 __M, __m512i __X, __m512i __Y)
static __inline__ __m128 __DEFAULT_FN_ATTRS _mm_rsqrt14_ss(__m128 __A, __m128 __B)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_ceil_pd(__m512d __A)
static vector float vector float __b
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_rsqrt14_pd(__m512d __A)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmple_epu32_mask(__m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fnmadd_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_and_epi32(__mmask16 __k, __m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_maskz_load_pd(__mmask8 __U, void const *__P)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpge_epu64_mask(__m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_mask_blend_pd(__mmask8 __U, __m512d __A, __m512d __W)
static __inline__ __m128 __DEFAULT_FN_ATTRS _mm_rcp14_ss(__m128 __A, __m128 __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmplt_epi64_mask(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_andnot_epi64(__mmask8 __U, __m512i __A, __m512i __B)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_fmsub_pd(__m512d __A, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_mul_epi32(__mmask8 __M, __m512i __X, __m512i __Y)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpgt_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpneq_epu64_mask(__m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_mul_pd(__m512d __a, __m512d __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_maskz_sub_epi64(__mmask8 __U, __m512i __A, __m512i __B)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_castps256_ps512(__m256 __a)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_xor_epi64(__m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_broadcastsd_pd(__m128d __X)
static __inline __m128d __DEFAULT_FN_ATTRS _mm512_castpd512_pd128(__m512d __a)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_castpd256_pd512(__m256d __a)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_add_epi32(__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpeq_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_or_epi64(__m512i __src, __mmask8 __k, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpneq_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_cvtepi32_pd(__m256i __A)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_add_pd(__m512d __a, __m512d __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fmadd_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpeq_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
#define _MM_FROUND_CUR_DIRECTION
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmple_epi64_mask(__m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fnmadd_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline __mmask16 __DEFAULT_FN_ATTRS _mm512_test_epi32_mask(__m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fmadd_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmple_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpneq_epu64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_permutex2var_pd(__m512d __A, __m512i __I, __m512d __B)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_mask_blend_ps(__mmask16 __U, __m512 __A, __m512 __W)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_cmpge_epi64_mask(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_maskz_mul_epu32(__mmask8 __M, __m512i __X, __m512i __Y)
static __inline void __DEFAULT_FN_ATTRS _mm512_store_pd(void *__P, __m512d __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_sub_epi64(__m512i __A, __m512i __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fmsubadd_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_maskz_fmsubadd_pd(__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_set1_epi64(long long __d)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_floor_ps(__m512 __A)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fmsub_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline__ __mmask8 __DEFAULT_FN_ATTRS _mm512_mask_cmpneq_epi64_mask(__mmask8 __u, __m512i __a, __m512i __b)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fmaddsub_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mask_mullo_epi32(__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_and_si512(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_setzero_si512(void)
static __inline__ __m128d __DEFAULT_FN_ATTRS _mm_rsqrt14_sd(__m128d __A, __m128d __B)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_and_epi64(__m512i __src, __mmask8 __k, __m512i __a, __m512i __b)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_sub_pd(__m512d __a, __m512d __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask3_fnmadd_ps(__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fmaddsub_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_mul_epi32(__m512i __X, __m512i __Y)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fmsubadd_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
#define __DEFAULT_FN_ATTRS
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_load_pd(float const *__p)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fmsubadd_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_xor_epi32(__m512i __a, __m512i __b)
static __inline __m256i __DEFAULT_FN_ATTRS _mm256_setzero_si256(void)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fmsubadd_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_ceil_ps(__m512 __A)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_fmsub_ps(__m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fmsub_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_cvttps_epu32(__m512 __A)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_or_epi32(__m512i __src, __mmask16 __k, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpneq_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_rcp14_ps(__m512 __A)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_storeu_epi32(void *__P, __mmask16 __U, __m512i __A)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_permutex2var_ps(__m512 __A, __m512i __I, __m512 __B)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_maskz_fmsub_ps(__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_sub_epi32(__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpge_epu32_mask(__m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmpneq_epi32_mask(__m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_broadcastss_ps(__m128 __X)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_max_epu64(__m512i __A, __m512i __B)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_mul_ps(__m512 __a, __m512 __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_add_epi32(__m512i __A, __m512i __B)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmplt_epu32_mask(__m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_andnot_epi64(__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_permutex2var_epi32(__m512i __A, __m512i __I, __m512i __B)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_cvttps_epi32(__m512 a)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_mask_fmaddsub_ps(__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpeq_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __m512 __DEFAULT_FN_ATTRS _mm512_max_ps(__m512 __A, __m512 __B)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask_fnmadd_pd(__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_mask3_fnmadd_pd(__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
static __inline __m512d __DEFAULT_FN_ATTRS _mm512_unpacklo_pd(__m512d __a, __m512d __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_abs_epi32(__m512i __A)
static __inline void __DEFAULT_FN_ATTRS _mm512_mask_storeu_pd(void *__P, __mmask8 __U, __m512d __A)
static __inline __m512 __DEFAULT_FN_ATTRS _mm512_maskz_loadu_ps(__mmask16 __U, void const *__P)
double __v8df __attribute__((__vector_size__(64)))
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmpge_epi32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline__ __m512i __DEFAULT_FN_ATTRS _mm512_mask_xor_epi64(__m512i __src, __mmask8 __k, __m512i __a, __m512i __b)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_mask_cmple_epu32_mask(__mmask16 __u, __m512i __a, __m512i __b)
static __inline void __DEFAULT_FN_ATTRS _mm512_store_ps(void *__P, __m512 __A)
static __inline__ __m512d __DEFAULT_FN_ATTRS _mm512_sqrt_pd(__m512d a)
static __inline__ __mmask16 __DEFAULT_FN_ATTRS _mm512_cmplt_epi32_mask(__m512i __a, __m512i __b)
static __inline __m512i __DEFAULT_FN_ATTRS _mm512_max_epi32(__m512i __A, __m512i __B)