1 /* { dg-do run } */
2 /* { dg-require-effective-target p8vector_hw } */
3 /* { dg-options "-O2 -mpower8-vector -Wno-psabi" } */
4
/* Header included below to provide the test harness.  The #ifndef guard
   lets a wrapper file or the command line substitute another header.  */
#ifndef CHECK_H
#define CHECK_H "sse4_1-check.h"
#endif

/* Name given to the test function defined at the end of this file.  It
   can likewise be overridden before this point.  */
#ifndef TEST
#define TEST sse4_1_test
#endif
12
13 #include CHECK_H
14
15 #include <smmintrin.h>
16 #include <string.h>
17 #include <stdlib.h>
18
/* Number of __m128 vectors in each test array; the float view of the
   same storage holds NUM * 4 elements.  */
#define NUM 20

/* Immediate selector passed to _mm_blend_ps.  In the reference check,
   bit j set means lane j is taken from the second source.  The default
   sets bits 0-3, so all four lanes come from the second source.  */
#ifndef MASK
#define MASK 0x0f
#endif
24
25 static void
26 init_blendps (float *src1, float *src2)
27 {
28 int i, sign = 1;
29
30 for (i = 0; i < NUM * 4; i++)
31 {
32 src1[i] = i * i * sign;
33 src2[i] = (i + 20) * sign;
34 sign = -sign;
35 }
36 }
37
38 static int
39 check_blendps (__m128 *dst, float *src1, float *src2)
40 {
41 float tmp[4];
42 int j;
43
44 memcpy (&tmp[0], src1, sizeof (tmp));
45 for (j = 0; j < 4; j++)
46 if ((MASK & (1 << j)))
47 tmp[j] = src2[j];
48
49 return memcmp (dst, &tmp[0], sizeof (tmp));
50 }
51
52 static void
53 TEST (void)
54 {
55 __m128 x, y;
56 union
57 {
58 __m128 x[NUM];
59 float f[NUM * 4];
60 } dst, src1, src2;
61 union
62 {
63 __m128 x;
64 float f[4];
65 } src3;
66 int i;
67
68 init_blendps (src1.f, src2.f);
69
70 for (i = 0; i < 4; i++)
71 src3.f[i] = (int) rand ();
72
73 /* Check blendps imm8, m128, xmm */
74 for (i = 0; i < NUM; i++)
75 {
76 dst.x[i] = _mm_blend_ps (src1.x[i], src2.x[i], MASK);
77 if (check_blendps (&dst.x[i], &src1.f[i * 4], &src2.f[i * 4]))
78 abort ();
79 }
80
81 /* Check blendps imm8, xmm, xmm */
82 x = _mm_blend_ps (dst.x[2], src3.x, MASK);
83 y = _mm_blend_ps (src3.x, dst.x[2], MASK);
84
85 if (check_blendps (&x, &dst.f[8], &src3.f[0]))
86 abort ();
87
88 if (check_blendps (&y, &src3.f[0], &dst.f[8]))
89 abort ();
90 }