/* { dg-do run } */
|
/* { dg-do run } */
|
/* { dg-require-effective-target avx } */
|
/* { dg-require-effective-target avx } */
|
/* { dg-require-effective-target c99_runtime } */
|
/* { dg-require-effective-target c99_runtime } */
|
/* { dg-options "-O2 -mavx -std=c99" } */
|
/* { dg-options "-O2 -mavx -std=c99" } */
|
|
|
#include "avx-check.h"
|
#include "avx-check.h"
|
#include <math.h>
|
#include <math.h>
|
|
|
float s1[]={2134.3343, 6678.346, 453.345635, 54646.464356};
|
float s1[]={2134.3343, 6678.346, 453.345635, 54646.464356};
|
float s2[]={41124.234, 6678.346, 8653.65635, 856.43576};
|
float s2[]={41124.234, 6678.346, 8653.65635, 856.43576};
|
int dd[] = {1, 2, 3, 4};
|
int dd[] = {1, 2, 3, 4};
|
float d[4];
|
float d[4];
|
union{int i[4]; float f[4];} e;
|
union{int i[4]; float f[4];} e;
|
|
|
void check(unsigned imm, char *id)
|
void check(unsigned imm, char *id)
|
{
|
{
|
if(checkVi((int*)d, e.i, 4)){
|
if(checkVi((int*)d, e.i, 4)){
|
printf("mm_cmp_ss(0x%x, %s) FAILED\n", imm, id);
|
printf("mm_cmp_ss(0x%x, %s) FAILED\n", imm, id);
|
}
|
}
|
}
|
}
|
|
|
static void
|
static void
|
avx_test ()
|
avx_test ()
|
{
|
{
|
__m128 source1, source2, dest;
|
__m128 source1, source2, dest;
|
int i;
|
int i;
|
|
|
#define CMP(imm, rel) \
|
#define CMP(imm, rel) \
|
e.i[0] = rel ? -1 : 0; \
|
e.i[0] = rel ? -1 : 0; \
|
dest = _mm_loadu_ps((float*)dd); \
|
dest = _mm_loadu_ps((float*)dd); \
|
source1 = _mm_loadu_ps(s1); \
|
source1 = _mm_loadu_ps(s1); \
|
source2 = _mm_loadu_ps(s2); \
|
source2 = _mm_loadu_ps(s2); \
|
dest = _mm_cmp_ss(source1, source2, imm); \
|
dest = _mm_cmp_ss(source1, source2, imm); \
|
_mm_storeu_ps(d, dest); \
|
_mm_storeu_ps(d, dest); \
|
check(imm, "" #imm "");
|
check(imm, "" #imm "");
|
|
|
for(i = 1; i < 4; i++) e.f[i] = s1[i];
|
for(i = 1; i < 4; i++) e.f[i] = s1[i];
|
|
|
CMP(_CMP_EQ_OQ, !isunordered(s1[0], s2[0]) && s1[0] == s2[0]);
|
CMP(_CMP_EQ_OQ, !isunordered(s1[0], s2[0]) && s1[0] == s2[0]);
|
CMP(_CMP_LT_OS, !isunordered(s1[0], s2[0]) && s1[0] < s2[0]);
|
CMP(_CMP_LT_OS, !isunordered(s1[0], s2[0]) && s1[0] < s2[0]);
|
CMP(_CMP_LE_OS, !isunordered(s1[0], s2[0]) && s1[0] <= s2[0]);
|
CMP(_CMP_LE_OS, !isunordered(s1[0], s2[0]) && s1[0] <= s2[0]);
|
CMP(_CMP_UNORD_Q, isunordered(s1[0], s2[0]));
|
CMP(_CMP_UNORD_Q, isunordered(s1[0], s2[0]));
|
CMP(_CMP_NEQ_UQ, isunordered(s1[0], s2[0]) || s1[0] != s2[0]);
|
CMP(_CMP_NEQ_UQ, isunordered(s1[0], s2[0]) || s1[0] != s2[0]);
|
CMP(_CMP_NLT_US, isunordered(s1[0], s2[0]) || s1[0] >= s2[0]);
|
CMP(_CMP_NLT_US, isunordered(s1[0], s2[0]) || s1[0] >= s2[0]);
|
CMP(_CMP_NLE_US, isunordered(s1[0], s2[0]) || s1[0] > s2[0]);
|
CMP(_CMP_NLE_US, isunordered(s1[0], s2[0]) || s1[0] > s2[0]);
|
CMP(_CMP_ORD_Q, !isunordered(s1[0], s2[0]));
|
CMP(_CMP_ORD_Q, !isunordered(s1[0], s2[0]));
|
|
|
CMP(_CMP_EQ_UQ, isunordered(s1[0], s2[0]) || s1[0] == s2[0]);
|
CMP(_CMP_EQ_UQ, isunordered(s1[0], s2[0]) || s1[0] == s2[0]);
|
CMP(_CMP_NGE_US, isunordered(s1[0], s2[0]) || s1[0] < s2[0]);
|
CMP(_CMP_NGE_US, isunordered(s1[0], s2[0]) || s1[0] < s2[0]);
|
CMP(_CMP_NGT_US, isunordered(s1[0], s2[0]) || s1[0] <= s2[0]);
|
CMP(_CMP_NGT_US, isunordered(s1[0], s2[0]) || s1[0] <= s2[0]);
|
|
|
CMP(_CMP_FALSE_OQ, 0);
|
CMP(_CMP_FALSE_OQ, 0);
|
CMP(_CMP_NEQ_OQ, !isunordered(s1[0], s2[0]) && s1[0] != s2[0]);
|
CMP(_CMP_NEQ_OQ, !isunordered(s1[0], s2[0]) && s1[0] != s2[0]);
|
CMP(_CMP_GE_OS, !isunordered(s1[0], s2[0]) && s1[0] >= s2[0]);
|
CMP(_CMP_GE_OS, !isunordered(s1[0], s2[0]) && s1[0] >= s2[0]);
|
CMP(_CMP_GT_OS, !isunordered(s1[0], s2[0]) && s1[0] > s2[0]);
|
CMP(_CMP_GT_OS, !isunordered(s1[0], s2[0]) && s1[0] > s2[0]);
|
CMP(_CMP_TRUE_UQ, 1);
|
CMP(_CMP_TRUE_UQ, 1);
|
|
|
CMP(_CMP_EQ_OS, !isunordered(s1[0], s2[0]) && s1[0] == s2[0]);
|
CMP(_CMP_EQ_OS, !isunordered(s1[0], s2[0]) && s1[0] == s2[0]);
|
CMP(_CMP_LT_OQ, !isunordered(s1[0], s2[0]) && s1[0] < s2[0]);
|
CMP(_CMP_LT_OQ, !isunordered(s1[0], s2[0]) && s1[0] < s2[0]);
|
CMP(_CMP_LE_OQ, !isunordered(s1[0], s2[0]) && s1[0] <= s2[0]);
|
CMP(_CMP_LE_OQ, !isunordered(s1[0], s2[0]) && s1[0] <= s2[0]);
|
CMP(_CMP_UNORD_S, isunordered(s1[0], s2[0]));
|
CMP(_CMP_UNORD_S, isunordered(s1[0], s2[0]));
|
CMP(_CMP_NEQ_US, isunordered(s1[0], s2[0]) || s1[0] != s2[0]);
|
CMP(_CMP_NEQ_US, isunordered(s1[0], s2[0]) || s1[0] != s2[0]);
|
CMP(_CMP_NLT_UQ, isunordered(s1[0], s2[0]) || s1[0] >= s2[0]);
|
CMP(_CMP_NLT_UQ, isunordered(s1[0], s2[0]) || s1[0] >= s2[0]);
|
CMP(_CMP_NLE_UQ, isunordered(s1[0], s2[0]) || s1[0] > s2[0]);
|
CMP(_CMP_NLE_UQ, isunordered(s1[0], s2[0]) || s1[0] > s2[0]);
|
CMP(_CMP_ORD_S, !isunordered(s1[0], s2[0]));
|
CMP(_CMP_ORD_S, !isunordered(s1[0], s2[0]));
|
CMP(_CMP_EQ_US, isunordered(s1[0], s2[0]) || s1[0] == s2[0]);
|
CMP(_CMP_EQ_US, isunordered(s1[0], s2[0]) || s1[0] == s2[0]);
|
CMP(_CMP_NGE_UQ, isunordered(s1[0], s2[0]) || s1[0] < s2[0]);
|
CMP(_CMP_NGE_UQ, isunordered(s1[0], s2[0]) || s1[0] < s2[0]);
|
CMP(_CMP_NGT_UQ, isunordered(s1[0], s2[0]) || s1[0] <= s2[0]);
|
CMP(_CMP_NGT_UQ, isunordered(s1[0], s2[0]) || s1[0] <= s2[0]);
|
CMP(_CMP_FALSE_OS, 0);
|
CMP(_CMP_FALSE_OS, 0);
|
CMP(_CMP_NEQ_OS, !isunordered(s1[0], s2[0]) && s1[0] != s2[0]);
|
CMP(_CMP_NEQ_OS, !isunordered(s1[0], s2[0]) && s1[0] != s2[0]);
|
CMP(_CMP_GE_OQ, !isunordered(s1[0], s2[0]) && s1[0] >= s2[0]);
|
CMP(_CMP_GE_OQ, !isunordered(s1[0], s2[0]) && s1[0] >= s2[0]);
|
CMP(_CMP_GT_OQ, !isunordered(s1[0], s2[0]) && s1[0] > s2[0]);
|
CMP(_CMP_GT_OQ, !isunordered(s1[0], s2[0]) && s1[0] > s2[0]);
|
CMP(_CMP_TRUE_US, 1);
|
CMP(_CMP_TRUE_US, 1);
|
}
|
}
|
|
|