1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
|
/* { dg-do run } */
/* { dg-options "-O3 -mpower8-vector -Wno-psabi" } */
/* { dg-require-effective-target lp64 } */
/* { dg-require-effective-target p8vector_hw } */
/* Harness header.  CHECK_H may be pre-defined (for example by a file that
   includes this one) to substitute a different header; otherwise
   "sse2-check.h" is used.  NOTE(review): the harness presumably supplies
   main and invokes TEST -- confirm against the header.  */
#ifndef CHECK_H
#define CHECK_H "sse2-check.h"
#endif
#include CHECK_H
/* Name under which the test body below is defined; it can be overridden
   in the same way as CHECK_H.  */
#ifndef TEST
#define TEST sse2_test_paddusb_1
#endif
/* Provides __m128i and the _mm_* intrinsics used below.  */
#include <emmintrin.h>
/* Out-of-line wrapper around _mm_adds_epu8.  Both operands are first
   passed through an empty asm as "+v" read-write operands, so the
   compiler must treat them as values it knows nothing about and cannot
   fold the addition at compile time; noinline keeps the call itself
   from being merged into the caller.  */
static __m128i
__attribute__((noinline, unused))
test (__m128i s1, __m128i s2)
{
  __m128i sum;

  __asm("" : "+v"(s1), "+v"(s2));
  sum = _mm_adds_epu8 (s1, s2);
  return sum;
}
/* Run _mm_adds_epu8 (through test ()) on two fixed 16-byte vectors and
   compare the result with a scalar reference computed lane by lane.

   On a mismatch the test calls abort ().  When DEBUG is non-zero it
   instead prints both operands, the actual result and the expected
   result, and does not abort.  */
static void
TEST (void)
{
  union128i_b u, s1, s2;
  char e[16] = {0};
  int i, tmp;

  s1.x = _mm_set_epi8 (30, 2, 3, 4, 10, 20, 30, 90, 80, 40, 100, 15, 98, 25, 98, 7);
  s2.x = _mm_set_epi8 (88, 44, 33, 22, 11, 98, 76, 100, 34, 78, 39, 6, 3, 4, 5, 119);
  u.x = test (s1.x, s2.x);

  for (i = 0; i < 16; i++)
    {
      /* Each byte is read as unsigned and summed in int, so the sum is
	 in the range 0..510 and cannot wrap before it is clamped.  */
      tmp = (unsigned char)s1.a[i] + (unsigned char)s2.a[i];

      /* Unsigned saturation: an overflowing lane must become 255.  The
	 previous code set tmp to -1 here and then reset every negative
	 tmp to 0, which made the expected value for a saturated lane 0.
	 NOTE: the largest lane sum in the vectors above is 190, so this
	 clamp is not exercised by the current inputs.  */
      if (tmp > 255)
	tmp = 255;

      e[i] = tmp;
    }

  if (check_union128i_b (u, e))
#if DEBUG
    {
      printf ("sse2_test_paddusb_1; check_union128i_b failed\n");
      printf (
	"\tadds\t([%x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x],\n",
	s1.a[0], s1.a[1], s1.a[2], s1.a[3], s1.a[4], s1.a[5], s1.a[6],
	s1.a[7], s1.a[8], s1.a[9], s1.a[10], s1.a[11], s1.a[12], s1.a[13],
	s1.a[14], s1.a[15]);
      printf ("\t\t [%x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x])\n",
	      s2.a[0], s2.a[1], s2.a[2], s2.a[3], s2.a[4], s2.a[5], s2.a[6],
	      s2.a[7], s2.a[8], s2.a[9], s2.a[10], s2.a[11], s2.a[12], s2.a[13],
	      s2.a[14], s2.a[15]);
      printf ("\t ->\t [%x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x]\n",
	      u.a[0], u.a[1], u.a[2], u.a[3], u.a[4], u.a[5], u.a[6], u.a[7],
	      u.a[8], u.a[9], u.a[10], u.a[11], u.a[12], u.a[13], u.a[14],
	      u.a[15]);
      printf (
	"\texpect\t [%x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x, %x,%x,%x,%x]\n",
	e[0], e[1], e[2], e[3], e[4], e[5], e[6], e[7], e[8], e[9], e[10],
	e[11], e[12], e[13], e[14], e[15]);
    }
#else
    abort ();
#endif
}
|