/* { dg-do run } */
/* { dg-options "-O2 -mavx512f" } */
/* { dg-require-effective-target avx512f } */

#include "avx512f-check.h"

#include "avx512f-helper.h"

/* Number of 32-bit float lanes in a 128-bit vector.  */
#define SIZE (128 / 32)
#include "avx512f-mask-type.h"

/* Run-time check of the masked scalar single-precision intrinsics
   _mm_mask_load_ss, _mm_maskz_load_ss, _mm_mask_move_ss,
   _mm_maskz_move_ss and _mm_mask_store_ss.

   The same sequence of calls is executed twice: first with bit 0 of
   the mask set (mask == 5), then with bit 0 cleared (mask == 4).  Bit 2
   stays set in both passes; the expected values below depend only on
   bit 0.  Any mismatch calls abort ().  */
void
avx512f_test (void)
{
  int i;
  union128 res1, res2, res3, res4, src1, src2, src3;
  /* The mask and the source pointer are volatile, presumably so that the
     compiler cannot evaluate the intrinsics at compile time.  */
  volatile __mmask8 mask = 5;
  float val[2] = { 35.5f, 0.0f };
  float *volatile p = &val[0];

  float res_ref[SIZE];
  float zero[SIZE];

  /* Give every lane of every source vector a distinct value so that a
     result taken from the wrong operand is detected.  */
  for (i = 0; i < SIZE; i++)
    {
      src1.a[i] = 1.5f + i;
      src2.a[i] = 7.5f + i;
      src3.a[i] = 4.5f + i;
      zero[i] = 0.0f;
    }

  /* Pass 1: mask bit 0 is set.  */

  /* Both load forms are expected to yield val[0] in lane 0 and zeros in
     the remaining lanes.  */
  res1.x = _mm_mask_load_ss (src1.x, mask, p);
  res2.x = _mm_maskz_load_ss (mask, p);

  __builtin_memcpy (res_ref, zero, sizeof (zero));
  res_ref[0] = val[0];
  if (check_union128 (res1, res_ref))
    abort ();

  if (check_union128 (res2, res_ref))
    abort ();

  /* Both move forms are expected to yield lane 0 of src3 and the upper
     lanes of src2.  */
  res3.x = _mm_mask_move_ss (src1.x, mask, src2.x, src3.x);
  res4.x = _mm_maskz_move_ss (mask, src2.x, src3.x);

  __builtin_memcpy (res_ref, src2.a, sizeof (src2.a));
  res_ref[0] = src3.a[0];
  if (check_union128 (res3, res_ref))
    abort ();

  if (check_union128 (res4, res_ref))
    abort ();

  /* The store is expected to write lane 0 of src1 into val[1].  */
  _mm_mask_store_ss (p + 1, mask, src1.x);
  if (val[1] != src1.a[0])
    abort ();

  /* Pass 2: clear mask bit 0 (mask becomes 4).  */
  mask ^= 1;

  res1.x = _mm_mask_load_ss (src1.x, mask, p);
  res2.x = _mm_maskz_load_ss (mask, p);

  /* The merging load is expected to keep lane 0 of src1; the upper lanes
     are still expected to be zero.  */
  __builtin_memcpy (res_ref, zero, sizeof (zero));
  res_ref[0] = src1.a[0];
  if (check_union128 (res1, res_ref))
    abort ();

  /* The zeroing load is expected to yield all zeros.  */
  res_ref[0] = zero[0];
  if (check_union128 (res2, res_ref))
    abort ();

  res3.x = _mm_mask_move_ss (src1.x, mask, src2.x, src3.x);
  res4.x = _mm_maskz_move_ss (mask, src2.x, src3.x);

  /* The merging move is expected to keep lane 0 of src1, with the upper
     lanes taken from src2.  */
  __builtin_memcpy (res_ref, src2.a, sizeof (src2.a));
  res_ref[0] = src1.a[0];
  if (check_union128 (res3, res_ref))
    abort ();

  /* The zeroing move is expected to yield zero in lane 0, with the upper
     lanes taken from src2.  */
  res_ref[0] = zero[0];
  if (check_union128 (res4, res_ref))
    abort ();

  /* With bit 0 clear the store must leave memory untouched: plant a
     sentinel and verify that it survives.  */
  val[1] = 42.0f;
  _mm_mask_store_ss (p + 1, mask, src1.x);
  if (val[1] != 42.0f)
    abort ();
}