37 lines
1.2 KiB
C
37 lines
1.2 KiB
C
|
/* { dg-do compile } */
/* { dg-require-effective-target powerpc_p8vector_ok } */
/* { dg-options "-mdejagnu-cpu=power8 -O3 " } */
/* { dg-final { scan-assembler-times "lxvd2x" 2 } } */
/* { dg-final { scan-assembler-times "stxvd2x" 1 } } */
/* { dg-final { scan-assembler-times "xxpermdi" 3 } } */

/* Verify that swap optimization works correctly for a VSX direct splat.
   The three xxpermdi's that are generated correspond to two splats
   and the __builtin_vsx_xxpermdi.  */

/* Local prototype for printf; the code visible in this file does not
   call it.  */
int printf (const char *__restrict __format, ...);

/* 16-byte vector of doubles.  The may_alias attribute allows objects of
   other types to be accessed through this type.  */
typedef double __m128d __attribute__ ((__vector_size__ (16), __may_alias__));

/* Inputs read by foo.  Element 0 differs between s1 and s2; element 1
   is the same value in both.  */
double s1[] = {2134.3343, 6678.346};
double s2[] = {41124.234, 6678.346};

/* d receives the vector result stored by foo.  dd is not referenced by
   the code visible in this file.  */
long long dd[] = {1, 2}, d[2];

/* Scratch object that foo writes through both its integer view (l) and
   its double view (d).  */
union{long long l[2]; double d[2];} e;

void
|
||
|
foo ()
|
||
|
{
|
||
|
__m128d source1, source2, dest;
|
||
|
__m128d a, b, c;
|
||
|
|
||
|
e.d[1] = s1[1];
|
||
|
e.l[0] = !__builtin_isunordered(s1[0], s2[0])
|
||
|
&& s1[0] == s2[0] ? -1 : 0;
|
||
|
source1 = __builtin_vec_vsx_ld (0, s1);
|
||
|
source2 = __builtin_vec_vsx_ld (0, s2);
|
||
|
a = __builtin_vec_splat (source1, 0);
|
||
|
b = __builtin_vec_splat (source2, 0);
|
||
|
c = (__m128d)__builtin_vec_cmpeq (a, b);
|
||
|
dest = __builtin_vsx_xxpermdi (source1, c, 1);
|
||
|
*(__m128d *)d = dest;
|
||
|
}
|