summaryrefslogtreecommitdiff
path: root/gcc/testsuite/gcc.target/aarch64/sve_vec_perm_1_overrange_run.c
blob: 1b98389d9962080b7a3f12d58ba0d9a9b986a207 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/* { dg-do run { target aarch64_sve_hw } } */
/* { dg-options "-O -march=armv8-a+sve" } */
/* { dg-options "-O -march=armv8-a+sve -msve-vector-bits=256" { target aarch64_sve256_hw } } */

#include "sve_vec_perm_1.c"

#define TEST_VEC_PERM(TYPE, MASK_TYPE, EXPECTED_RESULT,			\
		      VALUES1, VALUES2, MASK)				\
{									\
  TYPE expected_result = EXPECTED_RESULT;				\
  TYPE values1 = VALUES1;						\
  TYPE values2 = VALUES2;						\
  MASK_TYPE mask = MASK;						\
  TYPE dest;								\
  dest = vec_perm_##TYPE (values1, values2, mask);			\
  if (__builtin_memcmp (&dest, &expected_result, sizeof (TYPE)) != 0)	\
    __builtin_abort ();							\
}

int main (void)
{
  TEST_VEC_PERM (vnx2di, vnx2di,
		 ((vnx2di) { 5, 36, 7, 48 }),
		 ((vnx2di) { 4, 5, 6, 7 }),
		 ((vnx2di) { 12, 24, 36, 48 }),
		 ((vnx2di) { 1 + (8 * 1), 6 + (8 * 3),
			     3 + (8 * 1), 7 + (8 * 5) }));
  TEST_VEC_PERM (vnx4si, vnx4si,
		 ((vnx4si) { 34, 38, 40, 10, 9, 8, 7, 35 }),
		 ((vnx4si) { 3, 4, 5, 6, 7, 8, 9, 10 }),
		 ((vnx4si) { 33, 34, 35, 36, 37, 38, 39, 40 }),
		 ((vnx4si) { 9 + (16 * 2), 13 + (16 * 5),
			     15 + (16 * 1), 7 + (16 * 0),
			     6 + (16 * 8), 5 + (16 * 2),
			     4 + (16 * 3), 10 + (16 * 2) }));
  TEST_VEC_PERM (vnx8hi, vnx8hi,
		 ((vnx8hi) { 12, 16, 18, 10, 42, 43, 44, 34,
			     7, 48, 3, 35, 9, 8, 7, 13 }),
		 ((vnx8hi) { 3, 4, 5, 6, 7, 8, 9, 10,
			     11, 12, 13, 14, 15, 16, 17, 18 }),
		 ((vnx8hi) { 33, 34, 35, 36, 37, 38, 39, 40,
			     41, 42, 43, 44, 45, 46, 47, 48 }),
		 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
			     15 + (32 * 8), 7 + (32 * 9),
			     25 + (32 * 4), 26 + (32 * 3),
			     27 + (32 * 1), 17 + (32 * 2),
			     4 + (32 * 6), 31 + (32 * 7),
			     0 + (32 * 8), 18 + (32 * 9),
			     6 + (32 * 6), 5 + (32 * 7),
			     4 + (32 * 2), 10 + (32 * 2) }));
  TEST_VEC_PERM (vnx16qi, vnx16qi,
		 ((vnx16qi) { 5, 6, 7, 4, 5, 6, 4, 5,
			      6, 7, 12, 24, 36, 48, 12, 24,
			      5, 6, 7, 4, 5, 6, 4, 5,
			      6, 7, 12, 24, 36, 48, 12, 24 }),
		 ((vnx16qi) { 4, 5, 6, 7, 4, 5, 6, 7,
			      4, 5, 6, 7, 4, 5, 6, 7,
			      4, 5, 6, 7, 4, 5, 6, 7,
			      4, 5, 6, 7, 4, 5, 6, 7 }),
		 ((vnx16qi) { 12, 24, 36, 48, 12, 24, 36, 48,
			      12, 24, 36, 48, 12, 24, 36, 48,
			      12, 24, 36, 48, 12, 24, 36, 48,
			      12, 24, 36, 48, 12, 24, 36, 48 }),
		 ((vnx16qi) { 5 + (64 * 3), 6 + (64 * 1),
			      7 + (64 * 2), 8 + (64 * 1),
			      9 + (64 * 3), 10 + (64 * 1),
			      28 + (64 * 3), 29 + (64 * 3),
			      30 + (64 * 1), 31 + (64 * 1),
			      32 + (64 * 3), 33 + (64 * 2),
			      54 + (64 * 2), 55 + (64 * 2),
			      56 + (64 * 1), 61 + (64 * 2),
			      5 + (64 * 2), 6 + (64 * 1),
			      7 + (64 * 2), 8 + (64 * 2),
			      9 + (64 * 2), 10 + (64 * 1),
			      28 + (64 * 3), 29 + (64 * 1),
			      30 + (64 * 3), 31 + (64 * 3),
			      32 + (64 * 1), 33 + (64 * 1),
			      54 + (64 * 2), 55 + (64 * 2),
			      56 + (64 * 2), 61 + (64 * 2) }));
  TEST_VEC_PERM (vnx2df, vnx2di,
		 ((vnx2df) { 5.1, 36.1, 7.1, 48.1 }),
		 ((vnx2df) { 4.1, 5.1, 6.1, 7.1 }),
		 ((vnx2df) { 12.1, 24.1, 36.1, 48.1 }),
		 ((vnx2di) { 1 + (8 * 3), 6 + (8 * 10),
			     3 + (8 * 8), 7 + (8 * 2) }));
  TEST_VEC_PERM (vnx4sf, vnx4si,
		 ((vnx4sf) { 34.2, 38.2, 40.2, 10.2, 9.2, 8.2, 7.2, 35.2 }),
		 ((vnx4sf) { 3.2, 4.2, 5.2, 6.2, 7.2, 8.2, 9.2, 10.2 }),
		 ((vnx4sf) { 33.2, 34.2, 35.2, 36.2,
			     37.2, 38.2, 39.2, 40.2 }),
		 ((vnx4si) { 9 + (16 * 1), 13 + (16 * 5),
			     15 + (16 * 4), 7 + (16 * 4),
			     6 + (16 * 3), 5 + (16 * 2),
			     4 + (16 * 1), 10 + (16 * 0) }));
  TEST_VEC_PERM (vnx8hf, vnx8hi,
		 ((vnx8hf) { 12.0, 16.0, 18.0, 10.0, 42.0, 43.0, 44.0, 34.0,
			     7.0, 48.0, 3.0, 35.0, 9.0, 8.0, 7.0, 13.0 }),
		 ((vnx8hf) { 3.0, 4.0, 5.0, 6.0, 7.0, 8.0, 9.0, 10.0,
			     11.0, 12.0, 13.0, 14.0, 15.0, 16.0, 17.0, 18.0 }),
		 ((vnx8hf) { 33.0, 34.0, 35.0, 36.0, 37.0, 38.0, 39.0, 40.0,
			     41.0, 42.0, 43.0, 44.0, 45.0, 46.0, 47.0, 48.0 }),
		 ((vnx8hi) { 9 + (32 * 2), 13 + (32 * 2),
			     15 + (32 * 8), 7 + (32 * 9),
			     25 + (32 * 4), 26 + (32 * 3),
			     27 + (32 * 1), 17 + (32 * 2),
			     4 + (32 * 6), 31 + (32 * 7),
			     0 + (32 * 8), 18 + (32 * 9),
			     6 + (32 * 6), 5 + (32 * 7),
			     4 + (32 * 2), 10 + (32 * 2) }));
  return 0;
}