1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
|
/* { dg-do compile } */
/* { dg-options "-O2 -ftree-vectorize -ffast-math -march=armv8-a+sve" } */
#define TEST_LOOP(NAME, OUTTYPE, INTYPE, MASKTYPE) \
void __attribute__ ((noinline, noclone)) \
NAME##_3 (OUTTYPE *__restrict dest, INTYPE *__restrict src, \
MASKTYPE *__restrict cond, int n) \
{ \
for (int i = 0; i < n; ++i) \
if (cond[i]) \
dest[i] = (src[i * 3] \
+ src[i * 3 + 1] \
+ src[i * 3 + 2]); \
}
#define TEST2(NAME, OUTTYPE, INTYPE) \
TEST_LOOP (NAME##_i8, OUTTYPE, INTYPE, signed char) \
TEST_LOOP (NAME##_i16, OUTTYPE, INTYPE, unsigned short) \
TEST_LOOP (NAME##_f32, OUTTYPE, INTYPE, float) \
TEST_LOOP (NAME##_f64, OUTTYPE, INTYPE, double)
#define TEST1(NAME, OUTTYPE) \
TEST2 (NAME##_i8, OUTTYPE, signed char) \
TEST2 (NAME##_i16, OUTTYPE, unsigned short) \
TEST2 (NAME##_i32, OUTTYPE, int) \
TEST2 (NAME##_i64, OUTTYPE, unsigned long)
#define TEST(NAME) \
TEST1 (NAME##_i8, signed char) \
TEST1 (NAME##_i16, unsigned short) \
TEST1 (NAME##_i32, int) \
TEST1 (NAME##_i64, unsigned long) \
TEST2 (NAME##_f16_f16, _Float16, _Float16) \
TEST2 (NAME##_f32_f32, float, float) \
TEST2 (NAME##_f64_f64, double, double)
TEST (test)
/* Mask | 8 16 32 64
-------+------------
Out 8 | 1 1 1 1
16 | 1 1 1 1
32 | 1 1 1 1
64 | 1 1 1 1. */
/* { dg-final { scan-assembler-times {\tld3b\t.z[0-9]} 16 } } */
/* Mask | 8 16 32 64
-------+------------
Out 8 | 2 2 2 2
16 | 2 1 1 1 x2 (for _Float16)
32 | 2 1 1 1
64 | 2 1 1 1. */
/* { dg-final { scan-assembler-times {\tld3h\t.z[0-9]} 28 } } */
/* Mask | 8 16 32 64
-------+------------
Out 8 | 4 4 4 4
16 | 4 2 2 2
32 | 4 2 1 1 x2 (for float)
64 | 4 2 1 1. */
/* { dg-final { scan-assembler-times {\tld3w\t.z[0-9]} 50 } } */
/* Mask | 8 16 32 64
-------+------------
Out 8 | 8 8 8 8
16 | 8 4 4 4
32 | 8 4 2 2
64 | 8 4 2 1 x2 (for double). */
/* { dg-final { scan-assembler-times {\tld3d\t.z[0-9]} 98 } } */
|