OpenCores
URL https://opencores.org/ocsvn/openrisc/openrisc/trunk

Subversion Repositories openrisc

[/] [openrisc/] [tags/] [gnu-src/] [gcc-4.5.1/] [gcc-4.5.1-or32-1.0rc1/] [gcc/] [testsuite/] [gcc.target/] [i386/] [fma4-nmaccXX.c] - Blame information for rev 318

Go to most recent revision | Details | Compare with Previous | View Log

Line No. Rev Author Line
1 318 jeremybenn
/* { dg-do run } */
2
/* { dg-require-effective-target fma4 } */
3
/* { dg-options "-O0 -mfma4" } */
4
 
5
#include "fma4-check.h"
6
 
7
#include <x86intrin.h>
8
#include <string.h>
9
 
10
#define NUM 20
11
 
12
union
13
{
14
  __m128 x[NUM];
15
  float f[NUM * 4];
16
  __m128d y[NUM];
17
  double d[NUM * 2];
18
} dst, res, src1, src2, src3;
19
 
20
/* Note that in macc*, msub*, nmacc* and nmsub* instructions, the intermediate
21
   product is not rounded, only the addition is rounded. */
22
 
23
static void
24
init_nmaccps ()
25
{
26
  int i;
27
  for (i = 0; i < NUM * 4; i++)
28
    {
29
      src1.f[i] = i;
30
      src2.f[i] = i + 10;
31
      src3.f[i] = i + 20;
32
    }
33
}
34
 
35
static void
36
init_nmaccpd ()
37
{
38
  int i;
39
  for (i = 0; i < NUM * 4; i++)
40
    {
41
      src1.d[i] = i;
42
      src2.d[i] = i + 10;
43
      src3.d[i] = i + 20;
44
    }
45
}
46
 
47
static int
48
check_nmaccps ()
49
{
50
  int i, j, check_fails = 0;
51
  for (i = 0; i < NUM * 4; i = i + 4)
52
    for (j = 0; j < 4; j++)
53
      {
54
        res.f[i + j] = - (src1.f[i + j] * src2.f[i + j]) + src3.f[i + j];
55
        if (dst.f[i + j] != res.f[i + j])
56
          check_fails++;
57
      }
58
  return check_fails++;
59
}
60
 
61
static int
62
check_nmaccpd ()
63
{
64
  int i, j, check_fails = 0;
65
  for (i = 0; i < NUM * 2; i = i + 2)
66
    for (j = 0; j < 2; j++)
67
      {
68
        res.d[i + j] = - (src1.d[i + j] * src2.d[i + j]) + src3.d[i + j];
69
        if (dst.d[i + j] != res.d[i + j])
70
          check_fails++;
71
      }
72
  return check_fails++;
73
}
74
 
75
 
76
static int
77
check_nmaccss ()
78
{
79
  int i, j, check_fails = 0;
80
  for (i = 0; i < NUM * 4; i = i + 4)
81
    {
82
      res.f[i] = - (src1.f[i] * src2.f[i]) + src3.f[i];
83
      if (dst.f[i] != res.f[i])
84
        check_fails++;
85
    }
86
  return check_fails++;
87
}
88
 
89
static int
90
check_nmaccsd ()
91
{
92
  int i, j, check_fails = 0;
93
  for (i = 0; i < NUM * 2; i = i + 2)
94
    {
95
      res.d[i] = - (src1.d[i] * src2.d[i]) + src3.d[i];
96
      if (dst.d[i] != res.d[i])
97
        check_fails++;
98
    }
99
  return check_fails++;
100
}
101
 
102
static void
103
fma4_test (void)
104
{
105
  int i;
106
 
107
  init_nmaccps ();
108
 
109
  for (i = 0; i < NUM; i++)
110
    dst.x[i] = _mm_nmacc_ps (src1.x[i], src2.x[i], src3.x[i]);
111
 
112
  if (check_nmaccps ())
113
    abort ();
114
 
115
 
116
  for (i = 0; i < NUM; i++)
117
    dst.x[i] = _mm_nmacc_ss (src1.x[i], src2.x[i], src3.x[i]);
118
 
119
  if (check_nmaccss ())
120
    abort ();
121
 
122
  init_nmaccpd ();
123
 
124
  for (i = 0; i < NUM; i++)
125
    dst.y[i] = _mm_nmacc_pd (src1.y[i], src2.y[i], src3.y[i]);
126
 
127
  if (check_nmaccpd ())
128
    abort ();
129
 
130
 
131
  for (i = 0; i < NUM; i++)
132
    dst.y[i] = _mm_nmacc_sd (src1.y[i], src2.y[i], src3.y[i]);
133
 
134
  if (check_nmaccsd ())
135
    abort ();
136
 
137
}

powered by: WebSVN 2.1.0

© copyright 1999-2024 OpenCores.org, equivalent to Oliscience, all rights reserved. OpenCores®, registered trademark.