/* Source path: root/gcc/testsuite/gcc.target/i386/xop-vpermil2ps-256-1.c
   (blob d458d3e492b5326c345b5530a50fbc276cbfe7fe)  */
/* { dg-do run } */
/* { dg-require-effective-target xop } */
/* { dg-options "-O2 -mxop" } */

#include "xop-check.h"

#include <x86intrin.h>

/* Immediate handed to _mm256_permute2_ps as its last argument; its low two
   bits are also passed to the scalar reference model as imm8.  Defaults to 3
   unless ZERO_MATCH is already defined before this point.  */
#ifndef ZERO_MATCH
#define ZERO_MATCH  3
#endif

/* Scalar model of the element selection.  Only the low three bits of SEL
   are used: values 0-3 pick SRC1[0..3] and values 4-7 pick SRC2[0..3].
   Exactly one element is read.  */
static float
select2sp(float *src1, float *src2, int sel)
{
    const int idx = sel & 0x7;
    /* Bit 2 of the index chooses the source, bits 1:0 the element.  */
    const float *from = (idx & 0x4) ? src2 : src1;

    return from[idx & 0x3];
}
/* Scalar model of one result element: select a float with the low three
   bits of SEL, then optionally force it to zero.  The low two bits of IMM8
   choose the zeroing rule, keyed on bit 3 of SEL:
     2 - zero the result when bit 3 of SEL is set;
     3 - zero the result when bit 3 of SEL is clear;
     0 or 1 - never zero.  */
static float
sel_and_condzerosp(float *src1, float *src2, int sel, int imm8)
{
    const float picked = select2sp(src1, src2, sel & 0x7);
    const int zero_mode = imm8 & 0x3;
    const int bit3_set = (sel & 0x8) != 0;
    const int force_zero = (zero_mode == 2 && bit3_set)
                           || (zero_mode == 3 && !bit3_set);

    return force_zero ? 0 : picked;
}

/* Test body: run _mm256_permute2_ps on fixed inputs with the ZERO_MATCH
   immediate, build the expected eight floats with the scalar model
   sel_and_condzerosp, and abort if check_union256 reports a non-zero
   result (presumably a mismatch -- confirm against its definition).

   The declaration uses `static void' with a `(void)' parameter list:
   placing the storage class after the type and leaving the parameter
   list empty are both obsolescent forms in C.  */
static void
xop_test (void)
{
    int i;
    union256  source1, source2, u;
    union256i_d source3;
    float s1[8]={1, 2, 3, 4, 5, 6, 7, 8};
    float s2[8]={9, 10, 11, 12, 13, 14, 15, 16};
    /* Per-element selectors; only the low four bits are fed to the model.  */
    int   s3[8]={11, 2, 3, 15, 5, 12, 7, 8};
    float  e[8];

    source1.x = _mm256_loadu_ps(s1);
    source2.x = _mm256_loadu_ps(s2);
    source3.x = _mm256_loadu_si256((__m256i*) s3);
    u.x = _mm256_permute2_ps(source1.x, source2.x, source3.x, ZERO_MATCH);

    for (i = 0; i < 8; ++i) {
        /* i & 0x4 is 0 for elements 0-3 and 4 for elements 4-7, so each
           half of the result selects only from the matching four-element
           window of s1 and s2.  */
        e[i] = sel_and_condzerosp(&s1[i & 0x4], &s2[i & 0x4], s3[i] & 0xf, ZERO_MATCH & 0x3);
    }

    if (check_union256(u, e)) {
        abort ();
    }
}