/* { dg-do run } */
|
/* { dg-do run } */
|
/* { dg-require-effective-target xop } */
|
/* { dg-require-effective-target xop } */
|
/* { dg-options "-O2 -mxop" } */
|
/* { dg-options "-O2 -mxop" } */
|
|
|
#include "xop-check.h"
|
#include "xop-check.h"
|
|
|
#include <x86intrin.h>
|
#include <x86intrin.h>
|
|
|
#ifndef ZERO_MATCH
|
#ifndef ZERO_MATCH
|
#define ZERO_MATCH 3
|
#define ZERO_MATCH 3
|
#endif
|
#endif
|
|
|
static float
|
static float
|
select2sp(float *src1, float *src2, int sel)
|
select2sp(float *src1, float *src2, int sel)
|
{
|
{
|
float tmp;
|
float tmp;
|
|
|
if ((sel & 0x7) == 0) tmp = src1[0];
|
if ((sel & 0x7) == 0) tmp = src1[0];
|
if ((sel & 0x7) == 1) tmp = src1[1];
|
if ((sel & 0x7) == 1) tmp = src1[1];
|
if ((sel & 0x7) == 2) tmp = src1[2];
|
if ((sel & 0x7) == 2) tmp = src1[2];
|
if ((sel & 0x7) == 3) tmp = src1[3];
|
if ((sel & 0x7) == 3) tmp = src1[3];
|
if ((sel & 0x7) == 4) tmp = src2[0];
|
if ((sel & 0x7) == 4) tmp = src2[0];
|
if ((sel & 0x7) == 5) tmp = src2[1];
|
if ((sel & 0x7) == 5) tmp = src2[1];
|
if ((sel & 0x7) == 6) tmp = src2[2];
|
if ((sel & 0x7) == 6) tmp = src2[2];
|
if ((sel & 0x7) == 7) tmp = src2[3];
|
if ((sel & 0x7) == 7) tmp = src2[3];
|
|
|
return tmp;
|
return tmp;
|
}
|
}
|
static float
|
static float
|
sel_and_condzerosp(float *src1, float *src2, int sel, int imm8)
|
sel_and_condzerosp(float *src1, float *src2, int sel, int imm8)
|
{
|
{
|
float tmp;
|
float tmp;
|
|
|
tmp = select2sp(src1, src2, sel & 0x7);
|
tmp = select2sp(src1, src2, sel & 0x7);
|
|
|
if (((imm8 & 0x3) == 2) && ((sel & 0x8) == 0x8)) tmp = 0;
|
if (((imm8 & 0x3) == 2) && ((sel & 0x8) == 0x8)) tmp = 0;
|
if (((imm8 & 0x3) == 3) && ((sel & 0x8) == 0x0)) tmp = 0;
|
if (((imm8 & 0x3) == 3) && ((sel & 0x8) == 0x0)) tmp = 0;
|
|
|
return tmp;
|
return tmp;
|
}
|
}
|
|
|
void static
|
void static
|
xop_test ()
|
xop_test ()
|
{
|
{
|
int i;
|
int i;
|
union256 source1, source2, u;
|
union256 source1, source2, u;
|
union256i_d source3;
|
union256i_d source3;
|
float s1[8]={1, 2, 3, 4, 5, 6, 7, 8};
|
float s1[8]={1, 2, 3, 4, 5, 6, 7, 8};
|
float s2[8]={9, 10, 11, 12, 13, 14, 15, 16};
|
float s2[8]={9, 10, 11, 12, 13, 14, 15, 16};
|
int s3[8]={11, 2, 3, 15, 5, 12, 7, 8};
|
int s3[8]={11, 2, 3, 15, 5, 12, 7, 8};
|
float e[8];
|
float e[8];
|
|
|
source1.x = _mm256_loadu_ps(s1);
|
source1.x = _mm256_loadu_ps(s1);
|
source2.x = _mm256_loadu_ps(s2);
|
source2.x = _mm256_loadu_ps(s2);
|
source3.x = _mm256_loadu_si256((__m256i*) s3);
|
source3.x = _mm256_loadu_si256((__m256i*) s3);
|
u.x = _mm256_permute2_ps(source1.x, source2.x, source3.x, ZERO_MATCH);
|
u.x = _mm256_permute2_ps(source1.x, source2.x, source3.x, ZERO_MATCH);
|
|
|
for (i = 0; i < 8; ++i) {
|
for (i = 0; i < 8; ++i) {
|
e[i] = sel_and_condzerosp(&s1[i & 0x4], &s2[i & 0x4], s3[i] & 0xf, ZERO_MATCH & 0x3);
|
e[i] = sel_and_condzerosp(&s1[i & 0x4], &s2[i & 0x4], s3[i] & 0xf, ZERO_MATCH & 0x3);
|
}
|
}
|
|
|
if (check_union256(u, e))
|
if (check_union256(u, e))
|
abort ();
|
abort ();
|
}
|
}
|
|
|