/* { dg-do run } */ /* { dg-options "-O2 -mavx512ifma" } */ /* { dg-require-effective-target avx512ifma } */ #define AVX512IFMA #include "avx512f-helper.h" #define SIZE (AVX512F_LEN / 64) #include "avx512f-mask-type.h" void CALC (unsigned long long *r, unsigned long long *s1, unsigned long long *s2, unsigned long long *s3) { int i; /* Valid, because values are less than 1 << 26. */ for (i = 0; i < SIZE; i++) r[i] = s2[i] * s3[i] + s1[i]; } void TEST (void) { UNION_TYPE (AVX512F_LEN, i_q) src1, src2, dst1, dst2, dst3; unsigned long long dst_ref[SIZE]; int i; MASK_TYPE mask = MASK_VALUE; for (i = 0; i < SIZE; i++) { src1.a[i] = i + 50; src2.a[i] = i + 100; dst1.a[i] = DEFAULT_VALUE; dst2.a[i] = DEFAULT_VALUE; dst3.a[i] = DEFAULT_VALUE; } CALC (dst_ref, dst1.a, src1.a, src2.a); dst1.x = INTRINSIC (_madd52lo_epu64) (dst1.x, src1.x, src2.x); dst2.x = INTRINSIC (_mask_madd52lo_epu64) (dst2.x, mask, src1.x, src2.x); dst3.x = INTRINSIC (_maskz_madd52lo_epu64) (mask, dst3.x, src1.x, src2.x); if (UNION_CHECK (AVX512F_LEN, i_q) (dst1, dst_ref)) abort (); MASK_MERGE (i_q) (dst_ref, mask, SIZE); if (UNION_CHECK (AVX512F_LEN, i_q) (dst2, dst_ref)) abort (); MASK_ZERO (i_q) (dst_ref, mask, SIZE); if (UNION_CHECK (AVX512F_LEN, i_q) (dst3, dst_ref)) abort (); }