blob: 277f3a69db9a2960de20a36ca2aba0e8e56512c4 [file] [log] [blame]
/* APPLE LOCAL file 5612787 mainline sse4 */
/* { dg-do run { target i?86-*-* x86_64-*-* } } */
/* { dg-require-effective-target sse4a } */
/* { dg-options "-O2 -msse4a" } */
#include <ammintrin.h>
#include <stdlib.h>
#include "../../gcc.dg/i386-cpuid.h"
static void sse4a_test (void);
/* Test driver.  Reads the extended CPUID ECX feature bits and runs
   sse4a_test only when the SSE4a bit is set; in every other case the
   program simply exits with status 0.  */
int
main ()
{
  unsigned long cpu_facilities = i386_extended_cpuid_ecx ();

  /* Hosts without SSE4a cannot execute the test, so skip it there.  */
  if ((cpu_facilities & bit_SSE4a) != 0)
    {
      sse4a_test ();
    }

  exit (0);
}
/* Load the single float at IN into the low element of a vector with
   _mm_load_ss and write it to OUT with the _mm_stream_ss intrinsic.  */
static void
sse4a_test_movntss (float *out, float *in)
{
  _mm_stream_ss (out, _mm_load_ss (in));
}
/* Compare the first float at V1 with the first float at V2.
   Returns 0 when they compare equal and 1 when they differ.  */
static int
chk_ss (float *v1, float *v2)
{
  return (v1[0] != v2[0]) ? 1 : 0;
}
/* Input values for the test: sse4a_test passes the address of each
   element in turn to sse4a_test_movntss and then compares the stored
   result against the same element.  */
float vals[10] =
{
100.0, 200.0, 300.0, 400.0, 5.0,
-1.0, .345, -21.5, 9.32, 8.41
};
/* Exercise the SSE4a streaming scalar store.  Each element of vals is
   written into a heap-allocated float through sse4a_test_movntss and the
   stored value is compared with its source using chk_ss.

   Calls abort () when the destination buffer cannot be allocated or when
   any comparison reports a mismatch; otherwise exits with status 0.
   This function does not return.  */
static void
sse4a_test (void)
{
  int i;
  int fail = 0;
  float *out;

  out = malloc (sizeof *out);
  /* Never hand a null destination to the streaming store.  */
  if (out == NULL)
    abort ();

  /* Derive the element count from vals itself so the loop cannot drift
     out of sync with the table.  */
  for (i = 0; i < (int) (sizeof vals / sizeof vals[0]); i += 1)
    {
      sse4a_test_movntss (out, &vals[i]);
      fail += chk_ss (out, &vals[i]);
    }

  /* The buffer is no longer needed once all comparisons are done.  */
  free (out);

  if (fail != 0)
    abort ();

  exit (0);
}