/*
 * path: root/SingleSource/UnitTests/Vector/AVX512/reduce_add_mul_m512.c
 * blob: 0a9669e5c86ac51691c5a415e82f5b3a7a20e821
 */
#include "m512_test_util.h"
#include <stdio.h>
#include <string.h>

/*
 * Here we check for _mm512_[mask_]reduce_[add|mul] intrinsics.
 */

/*
 * Body of a double-precision test function: evaluates _mm512_<op>_pd(v1) and
 * _mm512_mask_<op>_pd(k8, v1) and hands each scalar result, together with its
 * expected value, to check_equal_ndf().
 *
 * This macro is not hygienic. Its expansion reads v1, exp1 and exp2 and
 * overwrites k8 with 0xAA (bits 1, 3, 5 and 7 set); all four names must be
 * declared in the scope where the macro is expanded, as DECL_PD does.
 *
 * The result is stored in a volatile local before being checked (presumably
 * to keep the compiler from folding the reduction away -- not stated in this
 * file).
 *
 * The body is wrapped in do { ... } while (0) so that "CHECK_PD(op);" forms
 * exactly one statement, even as the unbraced body of an if/else.
 */
#define CHECK_PD(op)                                                           \
  do {                                                                         \
    volatile double r = _mm512_##op##_pd(v1);                                  \
    check_equal_ndf(&r, &exp1, 1, "_mm512_" #op "_pd", __LINE__);              \
    k8 = 0xAA;                                                                 \
    r = _mm512_mask_##op##_pd(k8, v1);                                         \
    check_equal_ndf(&r, &exp2, 1, "_mm512_mask_" #op "_pd{1}", __LINE__);      \
  } while (0)

/*
 * Defines the test function "void do_<op>_pd(void)" for one double-precision
 * intrinsic family.
 *
 *   op    intrinsic name fragment, e.g. reduce_add
 *   srcv  value broadcast into every element of the source vector v1
 *   out1  expected result of the unmasked intrinsic
 *   out2  expected result of the masked intrinsic
 *
 * The locals k8, v1, exp1 and exp2 are declared here only because CHECK_PD
 * refers to them by name; k8 is assigned inside CHECK_PD before it is used.
 *
 * The parameter list is spelled (void) so the definition is a real prototype
 * rather than an old-style "unspecified arguments" definition.
 */
#define DECL_PD(op, srcv, out1, out2)                                          \
  void NOINLINE do_##op##_pd(void) {                                           \
    __mmask8 k8;                                                               \
    volatile __m512d v1 = _mm512_set1_pd((srcv));                              \
                                                                               \
    double exp1 = (out1);                                                      \
    double exp2 = (out2);                                                      \
                                                                               \
    CHECK_PD(op);                                                              \
  }

/* Invokes do_<op>_pd(), the function that DECL_PD(op, ...) defines. */
#define TEST_PD(op) (do_##op##_pd())

// PS version starts here.

/*
 * Body of a single-precision test function: evaluates _mm512_<op>_ps(v1) and
 * _mm512_mask_<op>_ps(k8, v1) and hands each scalar result, together with its
 * expected value, to check_equal_nsf().
 *
 * This macro is not hygienic. Its expansion reads v1, exp1 and exp2 and
 * overwrites k8 with 0xAAAA (every odd-numbered bit of a 16-bit mask); all
 * four names must be declared in the scope where the macro is expanded, as
 * DECL_PS does. Despite its name, k8 must be wide enough for a 16-bit mask
 * here.
 *
 * The body is wrapped in do { ... } while (0) so that "CHECK_PS(op);" forms
 * exactly one statement, even as the unbraced body of an if/else.
 */
#define CHECK_PS(op)                                                           \
  do {                                                                         \
    volatile float r = _mm512_##op##_ps(v1);                                   \
    check_equal_nsf(&r, &exp1, 1, "_mm512_" #op "_ps", __LINE__);              \
    k8 = 0xAAAA;                                                               \
    r = _mm512_mask_##op##_ps(k8, v1);                                         \
    check_equal_nsf(&r, &exp2, 1, "_mm512_mask_" #op "_ps{1}", __LINE__);      \
  } while (0)

/*
 * Defines the test function "void do_<op>_ps(void)" for one single-precision
 * intrinsic family.
 *
 *   op    intrinsic name fragment, e.g. reduce_add
 *   srcv  value broadcast into every element of the source vector v1
 *   out1  expected result of the unmasked intrinsic
 *   out2  expected result of the masked intrinsic
 *
 * The locals k8, v1, exp1 and exp2 are declared here only because CHECK_PS
 * refers to them by name. The mask is an __mmask16 even though it is called
 * k8: the name is fixed by CHECK_PS, which assigns it before use.
 *
 * The parameter list is spelled (void) so the definition is a real prototype
 * rather than an old-style "unspecified arguments" definition.
 */
#define DECL_PS(op, srcv, out1, out2)                                          \
  void NOINLINE do_##op##_ps(void) {                                           \
    __mmask16 k8;                                                              \
    volatile __m512 v1 = _mm512_set1_ps((srcv));                               \
                                                                               \
    float exp1 = (out1);                                                       \
    float exp2 = (out2);                                                       \
                                                                               \
    CHECK_PS(op);                                                              \
  }

/* Invokes do_<op>_ps(), the function that DECL_PS(op, ...) defines. */
#define TEST_PS(op) (do_##op##_ps())

/*
 * Instantiate the four test functions. Arguments are: operation, value placed
 * in every vector element, expected unmasked result, expected masked result.
 *
 * The masks assigned in CHECK_PD (0xAA) and CHECK_PS (0xAAAA) have half of
 * their bits set, so each masked expectation is the reduction over half of
 * the elements (4 doubles or 8 floats):
 *
 *   reduce_add pd:  8 * 0.5  = 4.0           4 * 0.5  = 2.0
 *   reduce_add ps: 16 * 0.4  = 6.4           8 * 0.4  = 3.2
 *   reduce_mul pd:  1.1^8    = 2.14358881    1.1^4    = 1.4641
 *   reduce_mul ps: (-1.1)^16 = 4.5949729...  (-1.1)^8 = 2.14358881
 *
 * The reduce_mul expectations are written at full literal precision, and as
 * double literals for the _pd case, so they sit as close as possible to the
 * true product. NOTE(review): check_equal_ndf/check_equal_nsf are defined
 * outside this file; repeated floating-point multiplication will not match
 * these decimals bit-for-bit, so this relies on the helpers comparing within
 * a tolerance -- confirm.
 */
DECL_PD(reduce_add, 0.5, 4.0, 2.0)
DECL_PS(reduce_add, 0.4f, 6.4f, 3.2f)
DECL_PD(reduce_mul, 1.1, 2.14358881, 1.4641)
DECL_PS(reduce_mul, -1.1f, 4.5949730f, 2.1435888f)

/*
 * Runs every reduce test defined above, then reports the overall outcome.
 *
 * Prints "PASSED" and returns 0 when n_errs is still zero after all tests
 * have run; otherwise prints "FAILED" and returns 1. argc and argv are not
 * used.
 */
int main(int argc, char *argv[]) {
  /* Double- and single-precision variants of each reduction, add first. */
  TEST_PD(reduce_add);
  TEST_PS(reduce_add);
  TEST_PD(reduce_mul);
  TEST_PS(reduce_mul);

  if (n_errs == 0) {
    printf("PASSED\n");
    return 0;
  }

  printf("FAILED\n");
  return 1;
}