Merge pull request #570 from Devsh-Graphics-Programming/new_hlsl_clz

devshgraphicsprogramming · web-flow · commit 5df8d96b0b99 · 2023-10-18T21:02:31.000+02:00
New hlsl clz
diff --git a/examples_tests b/examples_tests
@@ -1 +1 @@
-Subproject commit a1ba2842407fef41b1fe11a8bc9c1d638c1b4ab3
+Subproject commit e996ab690db2c3d3f446ad2071d1c7e1ce995a4f
diff --git a/include/nbl/builtin/hlsl/bit.hlsl b/include/nbl/builtin/hlsl/bit.hlsl
@@ -7,16 +7,17 @@
 #include <bit>
 
 namespace nbl::hlsl
-{
-
-NBL_ALIAS_TEMPLATE_FUNCTION(std::rotl, rotl);
-NBL_ALIAS_TEMPLATE_FUNCTION(std::rotr, rotr);
-
+{
+
+NBL_ALIAS_TEMPLATE_FUNCTION(std::rotl, rotl);
+NBL_ALIAS_TEMPLATE_FUNCTION(std::rotr, rotr);
+NBL_ALIAS_TEMPLATE_FUNCTION(std::countl_zero, countl_zero);
+
 }
 #else
 namespace nbl
 {
-namespace hlsl
+namespace hlsl
 {
 
 template<typename T, typename S>
@@ -36,7 +37,7 @@ T rotl(T x, S s)
     }
     else
     {
-        return (x >> (-r)) | (x << (N - (-r)));
+        return (x >> (-r)) | (x << (N - (-r)));
     }
 }
 
@@ -52,11 +53,28 @@ T rotr(T x, S s)
     }
     else
     {
-        return (x << (-r)) | (x >> (N - (-r)));
+        return (x << (-r)) | (x >> (N - (-r)));
     }
 }
 
-}
+// Leading zero count relative to the bit width of T (same contract as std::countl_zero), full width is returned for n==0.
+template<typename T>
+uint16_t countl_zero(T n)
+{
+    uint16_t result = 0u;
+    // binary search for the highest set bit, shift is half of the window that is still being examined
+    for (uint16_t shift = uint16_t(sizeof(T)*4u); shift != 0u; shift >>= 1u)
+    {
+        const T loMask = T((T(1)<<shift)-T(1));
+        const T hi = T((n>>shift)&loMask);
+        const bool chooseHigh = hi != T(0);
+        n = chooseHigh ? hi : T(n&loMask);
+        result += chooseHigh ? uint16_t(0) : shift; // skipping an empty upper half means shift more leading zeros
+    }
+    return uint16_t(result + (n != T(0) ? 0u : 1u)); // one bit is left, it is clear only when the input was zero
+}
+
+}
 }
 #endif
  
diff --git a/include/nbl/builtin/hlsl/colorspace/EOTF.hlsl b/include/nbl/builtin/hlsl/colorspace/EOTF.hlsl
@@ -9,7 +9,7 @@
 //#include <nbl/builtin/hlsl/common.hlsl>
 #include <nbl/builtin/hlsl/cpp_compat.hlsl>
 #include <nbl/builtin/hlsl/cpp_compat/promote.hlsl>
-#include <nbl/builtin/hlsl/cpp_compat/type_traits.hlsl>
+#include <nbl/builtin/hlsl/type_traits.hlsl>
 
 namespace nbl
 {
@@ -27,9 +27,9 @@ T identity(NBL_CONST_REF_ARG(T) nonlinear)
 }
 
 template<typename T>
-T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename scalar_type<T>::type vertex)
+T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename type_traits::scalar_type<T>::type vertex)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 right = (nonlinear > promote<T, Val_t>(vertex));
     return lerp(nonlinear / Val_t(12.92), pow((nonlinear + promote<T, Val_t>(0.055)) / Val_t(1.055), promote<T, Val_t>(2.4)), right);
 }
@@ -38,7 +38,7 @@ T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename scalar_type<T>::type
 template<typename T>
 T sRGB(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 negatif = (nonlinear < promote<T, Val_t>(0.0));
     T absVal = impl_shared_2_4<T>(abs(nonlinear), 0.04045);
     return lerp(absVal, -absVal, negatif);
@@ -48,21 +48,21 @@ T sRGB(NBL_CONST_REF_ARG(T) nonlinear)
 template<typename T>
 T Display_P3(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return impl_shared_2_4<T>(nonlinear, 0.039000312);
 }
 
 template<typename T>
 T DCI_P3_XYZ(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(nonlinear * Val_t(52.37), promote<T, Val_t>(2.6));
 }
 
 template<typename T>
 T SMPTE_170M(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     // ITU specs (and the outlier BT.2020) give different constants for these, but they introduce discontinuities in the mapping
     // because HDR swapchains often employ the RGBA16_SFLOAT format, this would become apparent because its higher precision than 8,10,12 bits
     Val_t alpha = 1.099296826809443; // 1.099 for all ITU but the BT.2020 12 bit encoding, 1.0993 otherwise
@@ -73,7 +73,7 @@ T SMPTE_170M(NBL_CONST_REF_ARG(T) nonlinear)
 template<typename T>
 T SMPTE_ST2084(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     const T invm2 = promote<T, Val_t>(1.0 / 78.84375);
     T _common = pow(invm2, invm2);
 
@@ -89,7 +89,7 @@ T SMPTE_ST2084(NBL_CONST_REF_ARG(T) nonlinear)
 template<typename T>
 T HDR10_HLG(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     // done with log2 so constants are different
     const Val_t a = 0.1239574303172;
     const T b = promote<T, Val_t>(0.02372241);
@@ -101,21 +101,21 @@ T HDR10_HLG(NBL_CONST_REF_ARG(T) nonlinear)
 template<typename T>
 T AdobeRGB(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(nonlinear, promote<T, Val_t>(2.19921875));
 }
 
 template<typename T>
 T Gamma_2_2(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(nonlinear, promote<T, Val_t>(2.2));
 }
 
 template<typename T>
 T ACEScc(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 right = (nonlinear >= promote<T, Val_t>(-0.301369863));
     T _common = exp2(nonlinear * Val_t(17.52) - promote<T, Val_t>(9.72));
     return max(lerp(_common * Val_t(2.0) - promote<T, Val_t>(0.000030517578125), _common, right), promote<T, Val_t>(65504.0));
@@ -124,7 +124,7 @@ T ACEScc(NBL_CONST_REF_ARG(T) nonlinear)
 template<typename T>
 T ACEScct(NBL_CONST_REF_ARG(T) nonlinear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 right = (nonlinear >= promote<T, Val_t>(0.155251141552511));
     return max(lerp((nonlinear - promote<T, Val_t>(0.0729055341958355)) / Val_t(10.5402377416545), exp2(nonlinear * Val_t(17.52) - promote<T, Val_t>(9.72)), right), promote<T, Val_t>(65504.0));
 }
diff --git a/include/nbl/builtin/hlsl/colorspace/OETF.hlsl b/include/nbl/builtin/hlsl/colorspace/OETF.hlsl
@@ -9,7 +9,7 @@
 //#include <nbl/builtin/hlsl/common.hlsl>
 #include <nbl/builtin/hlsl/cpp_compat.hlsl>
 #include <nbl/builtin/hlsl/cpp_compat/promote.hlsl>
-#include <nbl/builtin/hlsl/cpp_compat/type_traits.hlsl>
+#include <nbl/builtin/hlsl/type_traits.hlsl>
 
 namespace nbl
 {
@@ -27,9 +27,9 @@ T identity(NBL_CONST_REF_ARG(T) _linear)
 }
 
 template<typename T>
-T impl_shared_2_4(NBL_CONST_REF_ARG(T) _linear, typename scalar_type<T>::type vertex)
+T impl_shared_2_4(NBL_CONST_REF_ARG(T) _linear, typename type_traits::scalar_type<T>::type vertex)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 right = (_linear > promote<T, Val_t>(vertex));
     return lerp(_linear * Val_t(12.92), pow(_linear, promote<T, Val_t>(1.0 / 2.4)) * Val_t(1.055) - (Val_t(0.055)), right);
 }
@@ -38,7 +38,7 @@ T impl_shared_2_4(NBL_CONST_REF_ARG(T) _linear, typename scalar_type<T>::type ve
 template<typename T>
 T sRGB(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 negatif = (_linear < promote<T, Val_t>(0.0));
     T absVal = impl_shared_2_4<T>(abs(_linear), 0.0031308);
     return lerp(absVal, -absVal, negatif);
@@ -54,14 +54,14 @@ T Display_P3(NBL_CONST_REF_ARG(T) _linear)
 template<typename T>
 T DCI_P3_XYZ(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(_linear / Val_t(52.37), promote<T, Val_t>(1.0 / 2.6));
 }
 
 template<typename T>
 T SMPTE_170M(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     // ITU specs (and the outlier BT.2020) give different constants for these, but they introduce discontinuities in the mapping
     // because HDR swapchains often employ the RGBA16_SFLOAT format, this would become apparent because its higher precision than 8,10,12 bits
     const Val_t alpha = 1.099296826809443; // 1.099 for all ITU but the BT.2020 12 bit encoding, 1.0993 otherwise
@@ -72,7 +72,7 @@ T SMPTE_170M(NBL_CONST_REF_ARG(T) _linear)
 template<typename T>
 T SMPTE_ST2084(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     const T m1 = promote<T, Val_t>(0.1593017578125);
     const T m2 = promote<T, Val_t>(78.84375);
     const Val_t c2 = 18.8515625;
@@ -87,7 +87,7 @@ T SMPTE_ST2084(NBL_CONST_REF_ARG(T) _linear)
 template<typename T>
 T HDR10_HLG(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     
     // done with log2 so constants are different
     const Val_t a = 0.1239574303172;
@@ -100,21 +100,21 @@ T HDR10_HLG(NBL_CONST_REF_ARG(T) _linear)
 template<typename T>
 T AdobeRGB(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(_linear, promote<T, Val_t>(1.0 / 2.19921875));
 }
 
 template<typename T>
 T Gamma_2_2(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     return pow(_linear, promote<T, Val_t>(1.0 / 2.2));
 }
 
 template<typename T>
 T ACEScc(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 mid = (_linear >= promote<T, Val_t>(0.0));
     bool3 right = (_linear >= promote<T, Val_t>(0.000030517578125));
     return (log2(lerp(promote<T, Val_t>(0.0000152587890625), promote<T, Val_t>(0.0), right) + _linear * lerp(promote<T, Val_t>(0.0), lerp(promote<T, Val_t>(0.5), promote<T, Val_t>(1.0), right), mid)) + promote<T, Val_t>(9.72)) / Val_t(17.52);
@@ -123,7 +123,7 @@ T ACEScc(NBL_CONST_REF_ARG(T) _linear)
 template<typename T>
 T ACEScct(NBL_CONST_REF_ARG(T) _linear)
 {
-    typedef typename scalar_type<T>::type Val_t;
+    typedef typename type_traits::scalar_type<T>::type Val_t;
     bool3 right = (_linear > promote<T, Val_t>(0.0078125));
     return lerp(Val_t(10.5402377416545) * _linear + Val_t(0.0729055341958355), (log2(_linear) + promote<T, Val_t>(9.72)) / Val_t(17.52), right);
 }
diff --git a/include/nbl/builtin/hlsl/mpl.hlsl b/include/nbl/builtin/hlsl/mpl.hlsl
@@ -6,6 +6,9 @@
 
 #ifdef __HLSL_VERSION
 #include <nbl/builtin/hlsl/type_traits.hlsl>
+#else
+#include <bit>
+
 #endif
 
 namespace nbl
@@ -20,43 +23,47 @@ namespace impl
 {
 
 template<uint16_t bits_log2>
-struct clz_masks
+struct countl_zero_masks
 {
-    static const uint16_t SHIFT = uint16_t(1)<<(bits_log2-1);
-    static const uint64_t LO_MASK = (1ull<<SHIFT)-1;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t SHIFT = uint16_t(1)<<(bits_log2-1);
+    NBL_CONSTEXPR_STATIC_INLINE uint64_t LO_MASK = (1ull<<SHIFT)-1;
 };
 
 template<>
-struct clz_masks<0>
+struct countl_zero_masks<0>
 {
-    static const uint16_t SHIFT = 0;
-    static const uint64_t LO_MASK = 0;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t SHIFT = 0;
+    NBL_CONSTEXPR_STATIC_INLINE uint64_t LO_MASK = 0;
 };
 
 template<uint64_t N, uint16_t bits_log2>
-struct clz
+struct countl_zero
 {
-    static const bool CHOOSE_HIGH = N&(clz_masks<bits_log2>::LO_MASK<<clz_masks<bits_log2>::SHIFT);
-    static const uint64_t NEXT_N = (CHOOSE_HIGH ? (N>>clz_masks<bits_log2>::SHIFT):N)&clz_masks<bits_log2>::LO_MASK;
-    static const uint16_t value   = type_traits::conditional<bits_log2,clz<NEXT_N,bits_log2-1>,type_traits::integral_constant<uint16_t,0> >::type::value + (CHOOSE_HIGH ? 0ull:clz_masks<bits_log2>::SHIFT);
+    NBL_CONSTEXPR_STATIC_INLINE bool CHOOSE_HIGH = N&(countl_zero_masks<bits_log2>::LO_MASK<<countl_zero_masks<bits_log2>::SHIFT);
+    NBL_CONSTEXPR_STATIC_INLINE uint64_t NEXT_N = (CHOOSE_HIGH ? (N>>countl_zero_masks<bits_log2>::SHIFT):N)&countl_zero_masks<bits_log2>::LO_MASK;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t value   = type_traits::conditional<bits_log2,countl_zero<NEXT_N,bits_log2-1>,type_traits::integral_constant<uint16_t,0> >::type::value + (CHOOSE_HIGH ? 0ull:countl_zero_masks<bits_log2>::SHIFT);
 };
 
 }
+#endif
 
 template<uint64_t N>
-struct clz
+struct countl_zero
 {
-    static const uint16_t value = impl::clz<N, 6>::value;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t value =
+#ifdef __HLSL_VERSION
+      impl::countl_zero<N, 6>::value + (N ? uint16_t(0) : uint16_t(1)); // the recursion stops at 63 for N==0, std::countl_zero below yields 64
+#else
+      std::countl_zero(N);
+#endif
 };
 
 template<uint64_t X>
 struct log2
 {
-    static const uint16_t value = X ? (1ull<<6)-clz<X>::value-1 : -1ull;
+    NBL_CONSTEXPR_STATIC_INLINE uint16_t value = X ? (1ull<<6)-countl_zero<X>::value-1 : -1ull;
 };
 
-#endif
-
 }
 }
 }

Original file line number	Diff line number	Diff line change
`@@ -7,16 +7,17 @@`
`7`	`7`	`#include <bit>`
`8`	`8`
`9`	`9`	`namespace nbl::hlsl`
`10`		`-{`
`11`		`-`
`12`		`-NBL_ALIAS_TEMPLATE_FUNCTION(std::rotl, rotl);`
`13`		`-NBL_ALIAS_TEMPLATE_FUNCTION(std::rotr, rotr);`
`14`		`-`
	`10`	`+{`
	`11`	`+`
	`12`	`+NBL_ALIAS_TEMPLATE_FUNCTION(std::rotl, rotl);`
	`13`	`+NBL_ALIAS_TEMPLATE_FUNCTION(std::rotr, rotr);`
	`14`	`+NBL_ALIAS_TEMPLATE_FUNCTION(std::countl_zero, countl_zero);`
	`15`	`+`
`15`	`16`	`}`
`16`	`17`	`#else`
`17`	`18`	`namespace nbl`
`18`	`19`	`{`
`19`		`-namespace hlsl`
	`20`	`+namespace hlsl`
`20`	`21`	`{`
`21`	`22`
`22`	`23`	`template<typename T, typename S>`
`@@ -36,7 +37,7 @@ T rotl(T x, S s)`
`36`	`37`	`}`
`37`	`38`	`else`
`38`	`39`	`{`
`39`		`- return (x >> (-r)) \| (x << (N - (-r)));`
	`40`	`+ return (x >> (-r)) \| (x << (N - (-r)));`
`40`	`41`	`}`
`41`	`42`	`}`
`42`	`43`
`@@ -52,11 +53,28 @@ T rotr(T x, S s)`
`52`	`53`	`}`
`53`	`54`	`else`
`54`	`55`	`{`
`55`		`- return (x << (-r)) \| (x >> (N - (-r)));`
	`56`	`+ return (x << (-r)) \| (x >> (N - (-r)));`
`56`	`57`	`}`
`57`	`58`	`}`
`58`	`59`
`59`		`-}`
	`60`	`+// Leading zero count relative to the bit width of T (same contract as std::countl_zero), full width is returned for n==0.`
	`61`	`+template<typename T>`
	`62`	`+uint16_t countl_zero(T n)`
	`63`	`+{`
	`64`	`+ uint16_t result = 0u;`
	`65`	`+ // binary search for the highest set bit, shift is half of the window that is still being examined`
	`66`	`+ for (uint16_t shift = uint16_t(sizeof(T)*4u); shift != 0u; shift >>= 1u)`
	`67`	`+ {`
	`68`	`+ const T loMask = T((T(1)<<shift)-T(1));`
	`69`	`+ const T hi = T((n>>shift)&loMask);`
	`70`	`+ const bool chooseHigh = hi != T(0);`
	`71`	`+ n = chooseHigh ? hi : T(n&loMask);`
	`72`	`+ result += chooseHigh ? uint16_t(0) : shift; // skipping an empty upper half means shift more leading zeros`
	`73`	`+ }`
	`74`	`+ return uint16_t(result + (n != T(0) ? 0u : 1u)); // one bit is left, it is clear only when the input was zero`
	`75`	`+}`
	`76`	`+`
	`77`	`+}`
`60`	`78`	`}`
`61`	`79`	`#endif`
`62`	`80`
Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,7 @@`
`9`	`9`	`//#include <nbl/builtin/hlsl/common.hlsl>`
`10`	`10`	`#include <nbl/builtin/hlsl/cpp_compat.hlsl>`
`11`	`11`	`#include <nbl/builtin/hlsl/cpp_compat/promote.hlsl>`
`12`		`-#include <nbl/builtin/hlsl/cpp_compat/type_traits.hlsl>`
	`12`	`+#include <nbl/builtin/hlsl/type_traits.hlsl>`
`13`	`13`
`14`	`14`	`namespace nbl`
`15`	`15`	`{`
`@@ -27,9 +27,9 @@ T identity(NBL_CONST_REF_ARG(T) nonlinear)`
`27`	`27`	`}`
`28`	`28`
`29`	`29`	`template<typename T>`
`30`		`-T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename scalar_type<T>::type vertex)`
	`30`	`+T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename type_traits::scalar_type<T>::type vertex)`
`31`	`31`	`{`
`32`		`- typedef typename scalar_type<T>::type Val_t;`
	`32`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`33`	`33`	`bool3 right = (nonlinear > promote<T, Val_t>(vertex));`
`34`	`34`	`return lerp(nonlinear / Val_t(12.92), pow((nonlinear + promote<T, Val_t>(0.055)) / Val_t(1.055), promote<T, Val_t>(2.4)), right);`
`35`	`35`	`}`
`@@ -38,7 +38,7 @@ T impl_shared_2_4(NBL_CONST_REF_ARG(T) nonlinear, typename scalar_type<T>::type`
`38`	`38`	`template<typename T>`
`39`	`39`	`T sRGB(NBL_CONST_REF_ARG(T) nonlinear)`
`40`	`40`	`{`
`41`		`- typedef typename scalar_type<T>::type Val_t;`
	`41`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`42`	`42`	`bool3 negatif = (nonlinear < promote<T, Val_t>(0.0));`
`43`	`43`	`T absVal = impl_shared_2_4<T>(abs(nonlinear), 0.04045);`
`44`	`44`	`return lerp(absVal, -absVal, negatif);`
`@@ -48,21 +48,21 @@ T sRGB(NBL_CONST_REF_ARG(T) nonlinear)`
`48`	`48`	`template<typename T>`
`49`	`49`	`T Display_P3(NBL_CONST_REF_ARG(T) nonlinear)`
`50`	`50`	`{`
`51`		`- typedef typename scalar_type<T>::type Val_t;`
	`51`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`52`	`52`	`return impl_shared_2_4<T>(nonlinear, 0.039000312);`
`53`	`53`	`}`
`54`	`54`
`55`	`55`	`template<typename T>`
`56`	`56`	`T DCI_P3_XYZ(NBL_CONST_REF_ARG(T) nonlinear)`
`57`	`57`	`{`
`58`		`- typedef typename scalar_type<T>::type Val_t;`
	`58`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`59`	`59`	`return pow(nonlinear * Val_t(52.37), promote<T, Val_t>(2.6));`
`60`	`60`	`}`
`61`	`61`
`62`	`62`	`template<typename T>`
`63`	`63`	`T SMPTE_170M(NBL_CONST_REF_ARG(T) nonlinear)`
`64`	`64`	`{`
`65`		`- typedef typename scalar_type<T>::type Val_t;`
	`65`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`66`	`66`	`// ITU specs (and the outlier BT.2020) give different constants for these, but they introduce discontinuities in the mapping`
`67`	`67`	`// because HDR swapchains often employ the RGBA16_SFLOAT format, this would become apparent because its higher precision than 8,10,12 bits`
`68`	`68`	`Val_t alpha = 1.099296826809443; // 1.099 for all ITU but the BT.2020 12 bit encoding, 1.0993 otherwise`
`@@ -73,7 +73,7 @@ T SMPTE_170M(NBL_CONST_REF_ARG(T) nonlinear)`
`73`	`73`	`template<typename T>`
`74`	`74`	`T SMPTE_ST2084(NBL_CONST_REF_ARG(T) nonlinear)`
`75`	`75`	`{`
`76`		`- typedef typename scalar_type<T>::type Val_t;`
	`76`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`77`	`77`	`const T invm2 = promote<T, Val_t>(1.0 / 78.84375);`
`78`	`78`	`T _common = pow(invm2, invm2);`
`79`	`79`
`@@ -89,7 +89,7 @@ T SMPTE_ST2084(NBL_CONST_REF_ARG(T) nonlinear)`
`89`	`89`	`template<typename T>`
`90`	`90`	`T HDR10_HLG(NBL_CONST_REF_ARG(T) nonlinear)`
`91`	`91`	`{`
`92`		`- typedef typename scalar_type<T>::type Val_t;`
	`92`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`93`	`93`	`// done with log2 so constants are different`
`94`	`94`	`const Val_t a = 0.1239574303172;`
`95`	`95`	`const T b = promote<T, Val_t>(0.02372241);`
`@@ -101,21 +101,21 @@ T HDR10_HLG(NBL_CONST_REF_ARG(T) nonlinear)`
`101`	`101`	`template<typename T>`
`102`	`102`	`T AdobeRGB(NBL_CONST_REF_ARG(T) nonlinear)`
`103`	`103`	`{`
`104`		`- typedef typename scalar_type<T>::type Val_t;`
	`104`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`105`	`105`	`return pow(nonlinear, promote<T, Val_t>(2.19921875));`
`106`	`106`	`}`
`107`	`107`
`108`	`108`	`template<typename T>`
`109`	`109`	`T Gamma_2_2(NBL_CONST_REF_ARG(T) nonlinear)`
`110`	`110`	`{`
`111`		`- typedef typename scalar_type<T>::type Val_t;`
	`111`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`112`	`112`	`return pow(nonlinear, promote<T, Val_t>(2.2));`
`113`	`113`	`}`
`114`	`114`
`115`	`115`	`template<typename T>`
`116`	`116`	`T ACEScc(NBL_CONST_REF_ARG(T) nonlinear)`
`117`	`117`	`{`
`118`		`- typedef typename scalar_type<T>::type Val_t;`
	`118`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`119`	`119`	`bool3 right = (nonlinear >= promote<T, Val_t>(-0.301369863));`
`120`	`120`	`T _common = exp2(nonlinear * Val_t(17.52) - promote<T, Val_t>(9.72));`
`121`	`121`	`return max(lerp(_common * Val_t(2.0) - promote<T, Val_t>(0.000030517578125), _common, right), promote<T, Val_t>(65504.0));`
`@@ -124,7 +124,7 @@ T ACEScc(NBL_CONST_REF_ARG(T) nonlinear)`
`124`	`124`	`template<typename T>`
`125`	`125`	`T ACEScct(NBL_CONST_REF_ARG(T) nonlinear)`
`126`	`126`	`{`
`127`		`- typedef typename scalar_type<T>::type Val_t;`
	`127`	`+ typedef typename type_traits::scalar_type<T>::type Val_t;`
`128`	`128`	`bool3 right = (nonlinear >= promote<T, Val_t>(0.155251141552511));`
`129`	`129`	`return max(lerp((nonlinear - promote<T, Val_t>(0.0729055341958355)) / Val_t(10.5402377416545), exp2(nonlinear * Val_t(17.52) - promote<T, Val_t>(9.72)), right), promote<T, Val_t>(65504.0));`
`130`	`130`	`}`