/* { dg-do run } */
|
/* { dg-do run } */
|
/* { dg-require-effective-target sse4a } */
|
/* { dg-require-effective-target sse4a } */
|
/* { dg-options "-O2 -msse4a" } */
|
/* { dg-options "-O2 -msse4a" } */
|
|
|
#include "sse4a-check.h"
|
#include "sse4a-check.h"
|
|
|
#include <ammintrin.h>
|
#include <ammintrin.h>
|
|
|
static void
|
static void
|
sse4a_test_movntss (float *out, float *in)
|
sse4a_test_movntss (float *out, float *in)
|
{
|
{
|
__m128 in_v4sf = _mm_load_ss (in);
|
__m128 in_v4sf = _mm_load_ss (in);
|
_mm_stream_ss (out, in_v4sf);
|
_mm_stream_ss (out, in_v4sf);
|
}
|
}
|
|
|
static int
|
static int
|
chk_ss (float *v1, float *v2)
|
chk_ss (float *v1, float *v2)
|
{
|
{
|
int n_fails = 0;
|
int n_fails = 0;
|
if (v1[0] != v2[0])
|
if (v1[0] != v2[0])
|
n_fails += 1;
|
n_fails += 1;
|
return n_fails;
|
return n_fails;
|
}
|
}
|
|
|
float vals[10] =
|
float vals[10] =
|
{
|
{
|
100.0, 200.0, 300.0, 400.0, 5.0,
|
100.0, 200.0, 300.0, 400.0, 5.0,
|
-1.0, .345, -21.5, 9.32, 8.41
|
-1.0, .345, -21.5, 9.32, 8.41
|
};
|
};
|
|
|
static void
|
static void
|
sse4a_test (void)
|
sse4a_test (void)
|
{
|
{
|
int i;
|
int i;
|
int fail = 0;
|
int fail = 0;
|
float *out;
|
float *out;
|
|
|
out = (float *) malloc (sizeof (float));
|
out = (float *) malloc (sizeof (float));
|
for (i = 0; i < 10; i += 1)
|
for (i = 0; i < 10; i += 1)
|
{
|
{
|
sse4a_test_movntss (out, &vals[i]);
|
sse4a_test_movntss (out, &vals[i]);
|
|
|
fail += chk_ss (out, &vals[i]);
|
fail += chk_ss (out, &vals[i]);
|
}
|
}
|
|
|
if (fail != 0)
|
if (fail != 0)
|
abort ();
|
abort ();
|
}
|
}
|
|
|