1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
|
/* { dg-do run } */
/* { dg-require-effective-target sse4a } */
/* { dg-options "-O2 -msse4a" } */
#include "sse4a-check.h"
#include <ammintrin.h>
#include <stdlib.h>
/* Copy one double from IN to OUT using the intrinsics from <ammintrin.h>:
   the value is read with _mm_load_sd and written with _mm_stream_sd.
   NOTE(review): going by the function name this is meant to exercise the
   MOVNTSD instruction -- confirm against the intrinsic documentation.  */
static void
sse4a_test_movntsd (double *out, double *in)
{
/* Read the double at IN into a __m128d value.  */
__m128d in_v2df = _mm_load_sd (in);
/* Write that value to OUT through the streaming-store intrinsic.  */
_mm_stream_sd (out, in_v2df);
}
/* Compare the first double at V1 with the first double at V2.
   Returns 0 when the two compare equal and 1 when they do not.  */
static int
chk_sd (double *v1, double *v2)
{
  const double lhs = v1[0];
  const double rhs = v2[0];

  /* Plain != comparison: a NaN on either side is reported as a mismatch,
     while +0.0 and -0.0 are treated as equal.  */
  return (lhs != rhs) ? 1 : 0;
}
/* Input values fed one at a time through the store under test; the set
   mixes large, small, fractional and negative doubles.  */
double vals[10] =
  {
    100.0, 200.0,
    300.0, 400.0,
    5.0,   -1.0,
    0.345, -21.5,
    9.32,  8.41
  };
static void
sse4a_test (void)
{
int i;
int fail = 0;
double *out;
out = (double *) malloc (sizeof (double));
for (i = 0; i < 10; i += 1)
{
sse4a_test_movntsd (out, &vals[i]);
fail += chk_sd (out, &vals[i]);
}
if (fail != 0)
abort ();
}
|