alpaka3/test/unit/math/Defines.hpp at ffcfc3c27f7c821655a684f024f58f47291b94a4 · psychocoderHPC/alpaka3 · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/* Copyright 2022 Jakob Krude, Benjamin Worpitz, Sergei Bastrakov
 * SPDX-License-Identifier: MPL-2.0
 */

#pragma once

#include <alpaka/alpaka.hpp>

#include <cmath>
#include <iomanip>
#include <iostream>
#include <limits>

namespace mathtest
{
    // New types need to be added to the switch-case in DataGen.hpp
    enum class Range
    {
        OneNeighbourhood,
        PositiveOnly,
        PositiveAndZero,
        NotZero,
        Unrestricted,
        Anything
    };

    // New types need to be added to the operator() function in Functor.hpp
    enum class Arity
    {
        Unary = 1,
        Binary = 2,
        Ternary = 3
    };

    template<typename T, Arity Tarity>
    struct ArgsItem
    {
        static constexpr Arity arity = Tarity;
        static constexpr size_t arity_nr = static_cast<size_t>(Tarity);

        T arg[arity_nr]; // represents arg0, arg1, ...

        friend auto operator<<(std::ostream& os, ArgsItem const& argsItem) -> std::ostream&
        {
            os.precision(17);
            for(size_t i = 0; i < argsItem.arity_nr; ++i)
                os << (i == 0 ? "[ " : ", ") << std::setprecision(std::numeric_limits<T>::digits10 + 1)
                   << argsItem.arg[i];
            os << " ]";
            return os;
        }
    };

    //! Reference implementation of rsqrt, since there is no std::rsqrt
    template<typename T>
    auto rsqrt(T const& arg)
    {
        // Need ADL for complex numbers
        using std::sqrt;
        return static_cast<T>(1) / sqrt(arg);
    }

    //! Stub for division expressed same way as alpaka math traits
    template<typename T>
    ALPAKA_FN_HOST_ACC auto divides(T const& arg1, T const& arg2)
    {
        return arg1 / arg2;
    }

    //! Stub for subtraction expressed same way as alpaka math traits
    template<typename T>
    ALPAKA_FN_HOST_ACC auto minus(T const& arg1, T const& arg2)
    {
        return arg1 - arg2;
    }

    //! Stub for multiplication expressed same way as alpaka math traits
    template<typename T>
    ALPAKA_FN_HOST_ACC auto multiplies(T const& arg1, T const& arg2)
    {
        return arg1 * arg2;
    }

    //! Stub for addition expressed same way as alpaka math traits
    template<typename T>
    ALPAKA_FN_HOST_ACC auto plus(T const& arg1, T const& arg2)
    {
        return arg1 + arg2;
    }

    // https://en.cppreference.com/w/cpp/types/numeric_limits/epsilon
    template<typename FP>
    ALPAKA_FN_ACC auto almost_equal(FP x, FP y, int ulp)
        -> std::enable_if_t<!std::numeric_limits<FP>::is_integer, bool>
    {
        // the machine epsilon has to be scaled to the magnitude of the values used
        // and multiplied by the desired precision in ULPs (units in the last place)
        return alpaka::math::abs(x - y)
                   <= std::numeric_limits<FP>::epsilon() * alpaka::math::abs(x + y) * static_cast<FP>(ulp)
               // unless the result is subnormal
               || alpaka::math::abs(x - y) < std::numeric_limits<FP>::min();
    }

    //! Version for alpaka::math::Complex
    template<typename FP>
    ALPAKA_FN_ACC bool almost_equal(alpaka::math::Complex<FP> x, alpaka::math::Complex<FP> y, int ulp)
    {
        return almost_equal(x.real(), y.real(), ulp) && almost_equal(x.imag(), y.imag(), ulp);
    }

} // namespace mathtest