Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
132 changes: 0 additions & 132 deletions libclc/clc/include/clc/relational/floatn.inc

This file was deleted.

97 changes: 0 additions & 97 deletions libclc/libspirv/include/libspirv/generic/math/floatn.inc

This file was deleted.

26 changes: 0 additions & 26 deletions libclc/libspirv/include/libspirv/generic/math/minmag.inc

This file was deleted.

2 changes: 2 additions & 0 deletions libclc/libspirv/lib/amdgcn-amdhsa/SOURCES
Original file line number Diff line number Diff line change
@@ -1,5 +1,7 @@

workitem/get_global_offset.ll
geometric/normalize.cl
geometric/fast_normalize.cl
group/group_ballot.cl
group/collectives.cl
group/collectives_helpers.ll
Expand Down
17 changes: 17 additions & 0 deletions libclc/libspirv/lib/amdgcn-amdhsa/geometric/fast_normalize.cl
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include <libspirv/spirv.h>

// Scalar float overload: there is no separate fast path here, the call is
// forwarded unchanged to __spirv_ocl_normalize.
_CLC_OVERLOAD _CLC_DEF float __spirv_ocl_fast_normalize(float p) {
  const float normalized = __spirv_ocl_normalize(p);
  return normalized;
}

// Instantiate the overloads written in <fast_normalize.inc>: __CLC_BODY names
// the body file and __FLOAT_ONLY is set before pulling in the generic-type
// driver header.
// NOTE(review): presumably gentype.inc includes __CLC_BODY once per generic
// type and __FLOAT_ONLY restricts that to float types - confirm against
// clc/math/gentype.inc.
#define __CLC_BODY <fast_normalize.inc>
#define __FLOAT_ONLY
#include <clc/math/gentype.inc>
Original file line number Diff line number Diff line change
Expand Up @@ -6,12 +6,16 @@
//
//===----------------------------------------------------------------------===//

// Body instantiated once per generic type. Only widths 1 to 4 pass the outer
// guard, and the inner guard drops the scalar instantiation, so this file
// contributes the vector overloads only.
#if (__CLC_VECSIZE_OR_1 == 1 || __CLC_VECSIZE_OR_1 == 2 ||                     \
     __CLC_VECSIZE_OR_1 == 3 || __CLC_VECSIZE_OR_1 == 4)

#ifndef __CLC_SCALAR

// Only handle vector implementations.
//
// Returns p unchanged when its squared length compares equal to zero;
// otherwise scales p by __spirv_ocl_half_rsqrt of the squared length.
_CLC_OVERLOAD _CLC_DEF __CLC_GENTYPE
__spirv_ocl_fast_normalize(__CLC_GENTYPE p) {
  __CLC_SCALAR_GENTYPE l2 = __spirv_Dot(p, p);
  return l2 == 0.0f ? p : p * __spirv_ocl_half_rsqrt(l2);
}

#endif // !__CLC_SCALAR
#endif // __CLC_VECSIZE_OR_1 in {1, 2, 3, 4}
91 changes: 91 additions & 0 deletions libclc/libspirv/lib/amdgcn-amdhsa/geometric/normalize.cl
Original file line number Diff line number Diff line change
@@ -0,0 +1,91 @@
//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include <clc/clc_convert.h>
#include <clc/relational/clc_all.h>
#include <libspirv/spirv.h>

// Power-of-two rescale factors passed for the half instantiation: the first
// is applied to p when its squared length is too small, the second when the
// squared length is infinite.
#define HALF_MAX_SQRT 0x1.0p+8h
#define HALF_MIN_SQRT 0x1.0p-8h

// Smallest normal value of each supported element type. The entry is chosen
// inside _CLC_SPIRV_NORMALIZE_IMPL by pasting its FP_TYPE argument onto the
// prefix, so each one is expanded only where that type is instantiated.
// NOTE(review): assumes DBL_MIN and HALF_MIN are reachable through the same
// headers that already provide FLT_MIN - confirm.
#define _CLC_SPIRV_NORMALIZE_MIN_float FLT_MIN
#define _CLC_SPIRV_NORMALIZE_MIN_double DBL_MIN
#define _CLC_SPIRV_NORMALIZE_MIN_half HALF_MIN

// Defines the __spirv_ocl_normalize overload for the vector type
// FP_TYPE##VLEN.
//
//   FP_TYPE     scalar element type (float, double or half)
//   FLOAT_MARK  literal suffix matching FP_TYPE (f, empty or h)
//   INT_TYPE    integer element type the __spirv_IsInf result is converted
//               to before it is handed to select
//   VLEN        vector width
//   MAX_SQRT    factor applied to p when dot(p, p) is below the smallest
//               normal value of FP_TYPE
//   MIN_SQRT    factor applied to p when dot(p, p) is infinite
//
// Behaviour of the generated function:
//   1. An all-zero vector is returned unchanged.
//   2. If the squared length is below the smallest normal value of FP_TYPE
//      (previously FLT_MIN was used for every type), p is multiplied by
//      MAX_SQRT and the squared length is recomputed.
//   3. If the squared length is infinite, p is multiplied by MIN_SQRT and the
//      squared length recomputed; if it is still infinite, every component is
//      replaced by 1 where it is infinite and 0 elsewhere, keeping the sign
//      of the original component.
//   4. The result is p times rsqrt of the final squared length.
#define _CLC_SPIRV_NORMALIZE_IMPL(FP_TYPE, FLOAT_MARK, INT_TYPE, VLEN,         \
                                  MAX_SQRT, MIN_SQRT)                          \
  _CLC_OVERLOAD _CLC_DEF FP_TYPE##VLEN __spirv_ocl_normalize(                  \
      FP_TYPE##VLEN p) {                                                       \
    if (__clc_all(p == (FP_TYPE##VLEN)0.0##FLOAT_MARK))                        \
      return p;                                                                \
    FP_TYPE l2 = __spirv_Dot(p, p);                                            \
    if (l2 < _CLC_SPIRV_NORMALIZE_MIN_##FP_TYPE) {                             \
      p *= MAX_SQRT;                                                           \
      l2 = __spirv_Dot(p, p);                                                  \
    } else if (l2 == INFINITY) {                                               \
      p *= MIN_SQRT;                                                           \
      l2 = __spirv_Dot(p, p);                                                  \
      if (l2 == INFINITY) {                                                    \
        p = __spirv_ocl_copysign(                                              \
            __spirv_ocl_select(                                                \
                (FP_TYPE##VLEN)0.0##FLOAT_MARK,                                \
                (FP_TYPE##VLEN)1.0##FLOAT_MARK,                                \
                __clc_convert_##INT_TYPE##VLEN(__spirv_IsInf(p))),             \
            p);                                                                \
        l2 = __spirv_Dot(p, p);                                                \
      }                                                                        \
    }                                                                          \
    return p * __spirv_ocl_rsqrt(l2);                                          \
  }

// Scalar float overload: the result is whatever __spirv_ocl_sign returns.
_CLC_OVERLOAD _CLC_DEF float __spirv_ocl_normalize(float p) {
  const float direction = __spirv_ocl_sign(p);
  return direction;
}

// Vector float overloads for widths 2, 3 and 4. The wrapper fixes every
// _CLC_SPIRV_NORMALIZE_IMPL argument except the width; int is the integer
// element type and the two hex literals are the MAX_SQRT / MIN_SQRT factors.
#define _CLC_SPIRV_NORMALIZE(VLEN)                                             \
  _CLC_SPIRV_NORMALIZE_IMPL(float, f, int, VLEN, 0x1.0p+86F, 0x1.0p-65f)

_CLC_SPIRV_NORMALIZE(2)
_CLC_SPIRV_NORMALIZE(3)
_CLC_SPIRV_NORMALIZE(4)

// Drop the wrapper so the next element type can define its own.
#undef _CLC_SPIRV_NORMALIZE

#ifdef cl_khr_fp64

#pragma OPENCL EXTENSION cl_khr_fp64 : enable

// Scalar double overload: the result is whatever __spirv_ocl_sign returns.
_CLC_OVERLOAD _CLC_DEF double __spirv_ocl_normalize(double p) {
  const double direction = __spirv_ocl_sign(p);
  return direction;
}

// Vector double overloads for widths 2, 3 and 4. The literal suffix argument
// is left empty, long is the integer element type and the two hex literals
// are the MAX_SQRT / MIN_SQRT factors.
#define _CLC_SPIRV_NORMALIZE(VLEN)                                             \
  _CLC_SPIRV_NORMALIZE_IMPL(double, , long, VLEN, 0x1.0p+563, 0x1.0p-513)

_CLC_SPIRV_NORMALIZE(2)
_CLC_SPIRV_NORMALIZE(3)
_CLC_SPIRV_NORMALIZE(4)

// Drop the wrapper so the next element type can define its own.
#undef _CLC_SPIRV_NORMALIZE

#endif // cl_khr_fp64

#ifdef cl_khr_fp16

#pragma OPENCL EXTENSION cl_khr_fp16 : enable

// Scalar half overload: the result is whatever __spirv_ocl_sign returns.
_CLC_OVERLOAD _CLC_DEF half __spirv_ocl_normalize(half p) {
  const half direction = __spirv_ocl_sign(p);
  return direction;
}

// Vector half overloads for widths 2, 3 and 4. short is the integer element
// type; HALF_MAX_SQRT and HALF_MIN_SQRT are the MAX_SQRT / MIN_SQRT factors.
#define _CLC_SPIRV_NORMALIZE(VLEN)                                             \
  _CLC_SPIRV_NORMALIZE_IMPL(half, h, short, VLEN, HALF_MAX_SQRT, HALF_MIN_SQRT)

_CLC_SPIRV_NORMALIZE(2)
_CLC_SPIRV_NORMALIZE(3)
_CLC_SPIRV_NORMALIZE(4)

// The wrapper is not needed past this point.
#undef _CLC_SPIRV_NORMALIZE

#endif // cl_khr_fp16
Loading
Loading