/* { dg-do run } */ /* { dg-options "-O2 -mavx512f -std=c99" } */ /* { dg-require-effective-target avx512f } */ /* { dg-require-effective-target c99_runtime } */ #define AVX512F #include "avx512f-helper.h" #include #define SIZE (AVX512F_LEN / 64) #include "avx512f-mask-type.h" #undef SUF #undef SSIZE #undef GEN_CMP #undef CHECK_CMP #if AVX512F_LEN == 512 #define SUF(fun) _mm512##fun #define SSIZE 8 #define GEN_CMP(type) \ { \ dst3 = _mm512_cmp##type##_pd_mask(source1.x, source2.x);\ dst4 = _mm512_mask_cmp##type##_pd_mask(mask, source1.x, source2.x);\ if (dst3 != dst1) abort(); \ if (dst4 != dst2) abort(); \ } #define CHECK_CMP(imm) \ if (imm == _CMP_EQ_OQ) GEN_CMP(eq) \ if (imm == _CMP_LT_OS) GEN_CMP(lt) \ if (imm == _CMP_LE_OS) GEN_CMP(le) \ if (imm == _CMP_UNORD_Q) GEN_CMP(unord) \ if (imm == _CMP_NEQ_UQ) GEN_CMP(neq) \ if (imm == _CMP_NLT_US) GEN_CMP(nlt) \ if (imm == _CMP_NLE_US) GEN_CMP(nle) \ if (imm == _CMP_ORD_Q) GEN_CMP(ord) #endif #if AVX512F_LEN == 256 #define SUF(fun) _mm256##fun #define SSIZE 4 #define GEN_CMP(type) #define CHECK_CMP(imm) #endif #if AVX512F_LEN == 128 #define SUF(fun) _mm##fun #define SSIZE 2 #define GEN_CMP(type) #define CHECK_CMP(imm) #endif #undef CMP #define CMP(imm, rel) \ dst_ref = 0; \ for (i = 0; i < SSIZE; i++) \ { \ dst_ref = (((int) rel) << i) | dst_ref; \ } \ source1.x = SUF(_loadu_pd)(s1); \ source2.x = SUF(_loadu_pd)(s2); \ dst1 = SUF(_cmp_pd_mask)(source1.x, source2.x, imm);\ dst2 = SUF(_mask_cmp_pd_mask)(mask, source1.x, source2.x, imm);\ if (dst_ref != dst1) abort(); \ if ((dst_ref & mask) != dst2) abort(); \ CHECK_CMP(imm) void TEST () { UNION_TYPE (AVX512F_LEN, d) source1, source2; MASK_TYPE dst1, dst2, dst3, dst4, dst_ref; MASK_TYPE mask = MASK_VALUE; int i; double s1[8]={2134.3343, 6678.346, 453.345635, 54646.464, 231.23311, 5674.455, 111.111111, 23241.152}; double s2[8]={41124.234, 6678.346, 8653.65635, 856.43576, 231.23311, 4646.123, 111.111111, 124.12455}; CMP(_CMP_EQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]); CMP(_CMP_LT_OS, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]); CMP(_CMP_LE_OS, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]); CMP(_CMP_UNORD_Q, isunordered(s1[i], s2[i])); CMP(_CMP_NEQ_UQ, isunordered(s1[i], s2[i]) || s1[i] != s2[i]); CMP(_CMP_NLT_US, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]); CMP(_CMP_NLE_US, isunordered(s1[i], s2[i]) || s1[i] > s2[i]); CMP(_CMP_ORD_Q, !isunordered(s1[i], s2[i])); CMP(_CMP_EQ_UQ, isunordered(s1[i], s2[i]) || s1[i] == s2[i]); CMP(_CMP_NGE_US, isunordered(s1[i], s2[i]) || s1[i] < s2[i]); CMP(_CMP_NGT_US, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]); CMP(_CMP_FALSE_OQ, 0); CMP(_CMP_NEQ_OQ, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]); CMP(_CMP_GE_OS, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]); CMP(_CMP_GT_OS, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]); CMP(_CMP_TRUE_UQ, 1); CMP(_CMP_EQ_OS, !isunordered(s1[i], s2[i]) && s1[i] == s2[i]); CMP(_CMP_LT_OQ, !isunordered(s1[i], s2[i]) && s1[i] < s2[i]); CMP(_CMP_LE_OQ, !isunordered(s1[i], s2[i]) && s1[i] <= s2[i]); CMP(_CMP_UNORD_S, isunordered(s1[i], s2[i])); CMP(_CMP_NEQ_US, isunordered(s1[i], s2[i]) || s1[i] != s2[i]); CMP(_CMP_NLT_UQ, isunordered(s1[i], s2[i]) || s1[i] >= s2[i]); CMP(_CMP_NLE_UQ, isunordered(s1[i], s2[i]) || s1[i] > s2[i]); CMP(_CMP_ORD_S, !isunordered(s1[i], s2[i])); CMP(_CMP_EQ_US, isunordered(s1[i], s2[i]) || s1[i] == s2[i]); CMP(_CMP_NGE_UQ, isunordered(s1[i], s2[i]) || s1[i] < s2[i]); CMP(_CMP_NGT_UQ, isunordered(s1[i], s2[i]) || s1[i] <= s2[i]); CMP(_CMP_FALSE_OS, 0); CMP(_CMP_NEQ_OS, !isunordered(s1[i], s2[i]) && s1[i] != s2[i]); CMP(_CMP_GE_OQ, !isunordered(s1[i], s2[i]) && s1[i] >= s2[i]); CMP(_CMP_GT_OQ, !isunordered(s1[i], s2[i]) && s1[i] > s2[i]); CMP(_CMP_TRUE_US, 1) }