more small issues resolved

Erfan-Ahmadi · Erfan-Ahmadi · commit 2e902d02266b · 2021-02-14T11:05:02.000+03:30
diff --git a/examples_tests/49.ComputeFFT/convolve.comp b/examples_tests/49.ComputeFFT/convolve.comp
@@ -8,21 +8,19 @@
 
 layout(local_size_x=256, local_size_y=1, local_size_z=1) in;
  
- #define complex_value vec2
-
 layout(set=0, binding=0) restrict readonly buffer SrcBuffer
 {
-	complex_value src_data[];
+	nbl_glsl_complex src_data[];
 };
 
 layout(set=0, binding=1) restrict readonly buffer KernelBuffer
 {
-	complex_value ker_data[];
+	nbl_glsl_complex ker_data[];
 };
 
 layout(set=0, binding=2) restrict buffer OutputBuffer
 {
-	complex_value out_data[];
+	nbl_glsl_complex out_data[];
 };
 
 layout(push_constant) uniform PushConstants
diff --git a/examples_tests/49.ComputeFFT/remove_padding.comp b/examples_tests/49.ComputeFFT/remove_padding.comp
@@ -4,16 +4,13 @@
 
 #version 430 core
 
+#include <nbl/builtin/glsl/math/complex.glsl>
+
 layout(local_size_x=16, local_size_y=16, local_size_z=1) in;
  
-struct nbl_glsl_ext_FFT_output_t
-{
-	vec2 complex_value;
-};
-
 layout(set=0, binding=0) restrict readonly buffer Buffer
 {
-	nbl_glsl_ext_FFT_output_t data[];
+	nbl_glsl_complex data[];
 };
 
 layout(set=0, binding=1, rgba16f) uniform image2D outImage;
@@ -38,7 +35,7 @@ void main()
     vec4 color_value = vec4(0, 0, 0, 0);
     for(uint c = 0; c < pc.numChannels; ++c) {
 	    uint index = c * (padded_dimension.x * padded_dimension.y) + padded_coords.y * (padded_dimension.x) + padded_coords.x;
-        color_value[c] = data[index].complex_value.x;
+        color_value[c] = data[index].x;
     }
     imageStore(outImage, coords, color_value);
 }
diff --git a/include/nbl/builtin/glsl/ext/FFT/fft.glsl b/include/nbl/builtin/glsl/ext/FFT/fft.glsl
@@ -9,6 +9,7 @@
 
 // Shared Memory
 #include <nbl/builtin/glsl/workgroup/shared_arithmetic.glsl>
+#include <nbl/builtin/glsl/math/functions.glsl>
 
 
 #ifndef _NBL_GLSL_EXT_FFT_MAX_DIM_SIZE_
@@ -81,33 +82,22 @@ vec2 nbl_glsl_ext_FFT_getPaddedData(in uvec3 coordinate, in uint channel);
 #error "You need to define `nbl_glsl_ext_FFT_getPaddedData` and mark `_NBL_GLSL_EXT_FFT_GET_PADDED_DATA_DEFINED_`!"
 #endif
 
-// Count Leading Zeroes (naive?)
-uint nbl_glsl_ext_FFT_clz(in uint x) 
-{
-    return 31u - findMSB(x);
-}
-
-uint nbl_glsl_ext_FFT_reverseBits(in uint x)
-{
-    return bitfieldReverse(x);
-}
-
 uint nbl_glsl_ext_FFT_calculateTwiddlePower(in uint threadId, in uint iteration, in uint logTwoN) 
 {
     const uint shiftSuffix = logTwoN - 1u - iteration; // can we assert that iteration<logTwoN always?? yes
     const uint suffixMask = (2u << iteration) - 1u;
     return (threadId & suffixMask) << shiftSuffix;
 }
 
-nbl_glsl_complex nbl_glsl_ext_FFT_twiddle(in uint threadId, in uint iteration, in uint logTwoN, in uint N) 
+nbl_glsl_complex nbl_glsl_ext_FFT_twiddle(in uint threadId, in uint iteration, in uint logTwoN) // forward twiddle: feeds -2*PI*k / 2^logTwoN to nbl_glsl_expImaginary
 {
     uint k = nbl_glsl_ext_FFT_calculateTwiddlePower(threadId, iteration, logTwoN);
-    return nbl_glsl_expImaginary(-1 * 2 * nbl_glsl_PI * k / N);
+    return nbl_glsl_expImaginary(-1.0f * 2.0f * nbl_glsl_PI * float(k) / float(1u << logTwoN)); // unsigned shift + explicit float: the 2^logTwoN divisor cannot go negative at logTwoN == 31
 }
 
-nbl_glsl_complex nbl_glsl_ext_FFT_twiddleInverse(in uint threadId, in uint iteration, in uint logTwoN, in uint N) 
+nbl_glsl_complex nbl_glsl_ext_FFT_twiddleInverse(in uint threadId, in uint iteration, in uint logTwoN) 
 {
-    return nbl_glsl_complex_conjugate(nbl_glsl_ext_FFT_twiddle(threadId, iteration, logTwoN, N));
+    return nbl_glsl_complex_conjugate(nbl_glsl_ext_FFT_twiddle(threadId, iteration, logTwoN)); // twiddle used when pc.is_inverse is non-zero: complex conjugate of the forward twiddle for the same arguments
 }
 
 uint nbl_glsl_ext_FFT_getChannel()
@@ -124,7 +114,7 @@ uvec3 nbl_glsl_ext_FFT_getCoordinates(in uint tidx)
 
 uvec3 nbl_glsl_ext_FFT_getBitReversedCoordinates(in uvec3 coords, in uint leadingZeroes)
 {
-    uint bitReversedIndex = nbl_glsl_ext_FFT_reverseBits(coords[pc.direction]) >> leadingZeroes;
+    uint bitReversedIndex = bitfieldReverse(coords[pc.direction]) >> leadingZeroes;
     uvec3 tmp = coords;
     tmp[pc.direction] = bitReversedIndex;
     return tmp;
@@ -145,7 +135,7 @@ void nbl_glsl_ext_FFT()
 	uint channel = nbl_glsl_ext_FFT_getChannel();
     
 	// Pass 0: Bit Reversal
-	uint leadingZeroes = nbl_glsl_ext_FFT_clz(dataLength) + 1u;
+	uint leadingZeroes = nbl_glsl_clz(dataLength) + 1u;
 	uint logTwo = 32u - leadingZeroes;
 	
     nbl_glsl_complex current_values[_NBL_GLSL_EXT_FFT_MAX_ITEMS_PER_THREAD];
@@ -203,8 +193,8 @@ void nbl_glsl_ext_FFT()
             nbl_glsl_complex shuffled_value = shuffled_values[t];
 
             nbl_glsl_complex twiddle = (0u == pc.is_inverse) 
-             ? nbl_glsl_ext_FFT_twiddle(tid, i, logTwo, dataLength)
-             : nbl_glsl_ext_FFT_twiddleInverse(tid, i, logTwo, dataLength);
+             ? nbl_glsl_ext_FFT_twiddle(tid, i, logTwo)
+             : nbl_glsl_ext_FFT_twiddleInverse(tid, i, logTwo);
 
             nbl_glsl_complex this_value = current_values[t];
 
diff --git a/include/nbl/builtin/glsl/math/functions.glsl b/include/nbl/builtin/glsl/math/functions.glsl
@@ -244,6 +244,12 @@ uint nbl_glsl_rotl(in uint x, in uint k)
 	return (x<<k) | (x>>(32u-k));
 }
 
+// Count leading zeroes of a 32-bit uint: 31 minus the most-significant set bit index from findMSB. NOTE(review): the x == 0 result depends on findMSB's no-bit-set return value - confirm.
+uint nbl_glsl_clz(in uint x) 
+{
+    return 31u - findMSB(x);
+}
+
 
 // trig