|
6 | 6 | // |
7 | 7 | //===----------------------------------------------------------------------===// |
8 | 8 |
|
| 9 | +#include <clc/geometric/clc_normalize.h> |
9 | 10 | #include <clc/opencl/clc.h> |
10 | 11 |
|
11 | | -_CLC_OVERLOAD _CLC_DEF float normalize(float p) { return sign(p); } |
| 12 | +#define FUNCTION normalize |
| 13 | +#define __CLC_GEOMETRIC_RET_GENTYPE |
| 14 | +#define __CLC_BODY <clc/geometric/unary_def.inc> |
12 | 15 |
|
13 | | -_CLC_OVERLOAD _CLC_DEF float2 normalize(float2 p) { |
14 | | - if (all(p == (float2)0.0F)) |
15 | | - return p; |
16 | | - |
17 | | - float l2 = dot(p, p); |
18 | | - |
19 | | - if (l2 < FLT_MIN) { |
20 | | - p *= 0x1.0p+86F; |
21 | | - l2 = dot(p, p); |
22 | | - } else if (l2 == INFINITY) { |
23 | | - p *= 0x1.0p-65f; |
24 | | - l2 = dot(p, p); |
25 | | - if (l2 == INFINITY) { |
26 | | - p = copysign(select((float2)0.0F, (float2)1.0F, isinf(p)), p); |
27 | | - l2 = dot(p, p); |
28 | | - } |
29 | | - } |
30 | | - return p * rsqrt(l2); |
31 | | -} |
32 | | - |
33 | | -_CLC_OVERLOAD _CLC_DEF float3 normalize(float3 p) { |
34 | | - if (all(p == (float3)0.0F)) |
35 | | - return p; |
36 | | - |
37 | | - float l2 = dot(p, p); |
38 | | - |
39 | | - if (l2 < FLT_MIN) { |
40 | | - p *= 0x1.0p+86F; |
41 | | - l2 = dot(p, p); |
42 | | - } else if (l2 == INFINITY) { |
43 | | - p *= 0x1.0p-66f; |
44 | | - l2 = dot(p, p); |
45 | | - if (l2 == INFINITY) { |
46 | | - p = copysign(select((float3)0.0F, (float3)1.0F, isinf(p)), p); |
47 | | - l2 = dot(p, p); |
48 | | - } |
49 | | - } |
50 | | - return p * rsqrt(l2); |
51 | | -} |
52 | | - |
53 | | -_CLC_OVERLOAD _CLC_DEF float4 normalize(float4 p) { |
54 | | - if (all(p == (float4)0.0F)) |
55 | | - return p; |
56 | | - |
57 | | - float l2 = dot(p, p); |
58 | | - |
59 | | - if (l2 < FLT_MIN) { |
60 | | - p *= 0x1.0p+86F; |
61 | | - l2 = dot(p, p); |
62 | | - } else if (l2 == INFINITY) { |
63 | | - p *= 0x1.0p-66f; |
64 | | - l2 = dot(p, p); |
65 | | - if (l2 == INFINITY) { |
66 | | - p = copysign(select((float4)0.0F, (float4)1.0F, isinf(p)), p); |
67 | | - l2 = dot(p, p); |
68 | | - } |
69 | | - } |
70 | | - return p * rsqrt(l2); |
71 | | -} |
72 | | - |
73 | | -#ifdef cl_khr_fp64 |
74 | | - |
75 | | -#pragma OPENCL EXTENSION cl_khr_fp64 : enable |
76 | | - |
77 | | -_CLC_OVERLOAD _CLC_DEF double normalize(double p) { return sign(p); } |
78 | | - |
79 | | -_CLC_OVERLOAD _CLC_DEF double2 normalize(double2 p) { |
80 | | - if (all(p == (double2)0.0)) |
81 | | - return p; |
82 | | - |
83 | | - double l2 = dot(p, p); |
84 | | - |
85 | | - if (l2 < DBL_MIN) { |
86 | | - p *= 0x1.0p+563; |
87 | | - l2 = dot(p, p); |
88 | | - } else if (l2 == INFINITY) { |
89 | | - p *= 0x1.0p-513; |
90 | | - l2 = dot(p, p); |
91 | | - if (l2 == INFINITY) { |
92 | | - p = copysign(select((double2)0.0, (double2)1.0, isinf(p)), p); |
93 | | - l2 = dot(p, p); |
94 | | - } |
95 | | - } |
96 | | - return p * rsqrt(l2); |
97 | | -} |
98 | | - |
99 | | -_CLC_OVERLOAD _CLC_DEF double3 normalize(double3 p) { |
100 | | - if (all(p == (double3)0.0)) |
101 | | - return p; |
102 | | - |
103 | | - double l2 = dot(p, p); |
104 | | - |
105 | | - if (l2 < DBL_MIN) { |
106 | | - p *= 0x1.0p+563; |
107 | | - l2 = dot(p, p); |
108 | | - } else if (l2 == INFINITY) { |
109 | | - p *= 0x1.0p-514; |
110 | | - l2 = dot(p, p); |
111 | | - if (l2 == INFINITY) { |
112 | | - p = copysign(select((double3)0.0, (double3)1.0, isinf(p)), p); |
113 | | - l2 = dot(p, p); |
114 | | - } |
115 | | - } |
116 | | - return p * rsqrt(l2); |
117 | | -} |
118 | | - |
119 | | -_CLC_OVERLOAD _CLC_DEF double4 normalize(double4 p) { |
120 | | - if (all(p == (double4)0.0)) |
121 | | - return p; |
122 | | - |
123 | | - double l2 = dot(p, p); |
124 | | - |
125 | | - if (l2 < DBL_MIN) { |
126 | | - p *= 0x1.0p+563; |
127 | | - l2 = dot(p, p); |
128 | | - } else if (l2 == INFINITY) { |
129 | | - p *= 0x1.0p-514; |
130 | | - l2 = dot(p, p); |
131 | | - if (l2 == INFINITY) { |
132 | | - p = copysign(select((double4)0.0, (double4)1.0, isinf(p)), p); |
133 | | - l2 = dot(p, p); |
134 | | - } |
135 | | - } |
136 | | - return p * rsqrt(l2); |
137 | | -} |
138 | | - |
139 | | -#endif |
| 16 | +#include <clc/math/gentype.inc> |
0 commit comments