Refactor traceRay to return the hit object ID; remove maxT from ImmutableRay_t

devshgraphicsprogramming · devshgraphicsprogramming · commit 9ea21b4810f3 · 2021-03-12T18:26:15.000+01:00
diff --git a/examples_tests/42.FragmentShaderPathTracer/common.glsl b/examples_tests/42.FragmentShaderPathTracer/common.glsl
@@ -313,7 +313,6 @@ Light lights[LIGHT_COUNT] =
 struct ImmutableRay_t
 {
     vec3 origin;
-    float maxT;
     vec3 direction;
 #if defined(TRIANGLE_METHOD)||defined(RECTANGLE_METHOD)
     vec3 normalAtOrigin;
@@ -375,21 +374,13 @@ void missProgram(in ImmutableRay_t _immutable, inout Payload_t _payload)
 {
     vec3 finalContribution = _payload.throughput; 
     //#define USE_ENVMAP
-    // true miss
-    if (_immutable.maxT>=FLT_MAX)
-    {
-        #ifdef USE_ENVMAP
-	        vec2 uv = SampleSphericalMap(_immutable.direction);
-            finalContribution *= textureLod(envMap, uv, 0.0).rgb;
-        #else
-        const vec3 kConstantEnvLightRadiance = vec3(0.15, 0.21, 0.3);
-            finalContribution *= kConstantEnvLightRadiance;
-        #endif
-    }
-    else
-    {
-        finalContribution *= _payload.otherTechniqueHeuristic;
-    }
+#ifdef USE_ENVMAP
+	vec2 uv = SampleSphericalMap(_immutable.direction);
+    finalContribution *= textureLod(envMap, uv, 0.0).rgb;
+#else
+    const vec3 kConstantEnvLightRadiance = vec3(0.15, 0.21, 0.3);
+    finalContribution *= kConstantEnvLightRadiance;
+#endif
     _payload.accumulation += finalContribution;
 }
 
@@ -493,7 +484,7 @@ mat2x3 rand3d(in uint protoDimension, in uint _sample, inout nbl_glsl_xoroshiro6
     return retval;
 }
 
-void traceRay(in bool anyHit, in ImmutableRay_t _immutable, inout MutableRay_t _mutable);
+int traceRay(inout float intersectionT, in ImmutableRay_t _immutable);
 bool closestHitProgram(in uint depth, in uint _sample, inout Ray_t ray, inout nbl_glsl_xoroshiro64star_state_t scramble_state);
 
 void main()
@@ -520,6 +511,7 @@ void main()
 
     vec3 color = vec3(0.0);
     float meanLumaSquared = 0.0;
+    // TODO: if we collapse the nested for loop, then all GPUs will get a `MAX_DEPTH` factor speedup, not just NVIDIA GPUs with separate program counters (PC)
     for (int i=0; i<SAMPLES; i++)
     {
         nbl_glsl_xoroshiro64star_state_t scramble_state = scramble_start_state;
@@ -528,7 +520,6 @@ void main()
         // raygen
         {
             ray._immutable.origin = camPos;
-            ray._immutable.maxT = FLT_MAX;
 
             vec4 tmp = NDC;
             // apply stochastic reconstruction filter
@@ -555,19 +546,20 @@ void main()
             #endif
         }
 
-        // trace
-        for (int j=1; j<=MAX_DEPTH; j+=2)
+        // bounces
         {
-            const ImmutableRay_t _immutable = ray._immutable;
-            traceRay(false,_immutable,ray._mutable);
-                
-            if (ray._mutable.intersectionT>=_immutable.maxT)
+            bool hit = true; bool rayAlive = true;
+            for (int d=1; d<=MAX_DEPTH && hit && rayAlive; d+=2)
             {
-                missProgram(_immutable,ray._payload);
-                break;
+                ray._mutable.intersectionT = FLT_MAX;
+                ray._mutable.objectID = traceRay(ray._mutable.intersectionT,ray._immutable);
+                hit = ray._mutable.objectID!=-1;
+                if (hit)
+                    rayAlive = closestHitProgram(3u, i, ray, scramble_state);
             }
-            else if (closestHitProgram(j,i,ray,scramble_state))
-                break;
+            // was last trace a miss?
+            if (!hit)
+                missProgram(ray._immutable,ray._payload);
         }
 
         vec3 accumulation = ray._payload.accumulation;
diff --git a/examples_tests/42.FragmentShaderPathTracer/litBySphere.frag b/examples_tests/42.FragmentShaderPathTracer/litBySphere.frag
@@ -10,10 +10,9 @@
 
 
 
-void traceRay(in bool anyHit, in ImmutableRay_t _immutable, inout MutableRay_t _mutable)
+int traceRay(inout float intersectionT, in ImmutableRay_t _immutable)
 {
 	int objectID = -1;
-    float intersectionT = _immutable.maxT;
 	for (int i=0; i<SPHERE_COUNT; i++)
     {
         float t = Sphere_intersect(spheres[i],_immutable.origin,_immutable.direction);
@@ -26,8 +25,7 @@ void traceRay(in bool anyHit, in ImmutableRay_t _immutable, inout MutableRay_t _
         //if (anyHit && closerIntersection && anyHitProgram(_immutable))
            //break;
     }
-    _mutable.objectID = objectID;
-    _mutable.intersectionT = intersectionT;
+    return objectID;
 }
 
 #if 0
@@ -87,12 +85,12 @@ bool closestHitProgram(in uint depth, in uint _sample, inout Ray_t ray, inout nb
     const uint bsdfLightIDs = sphere.bsdfLightIDs;
 
     vec3 throughput = ray._payload.throughput;
-    
+#if 1
     // add emissive
     const uint lightID = bitfieldExtract(bsdfLightIDs,16,16);
     if (lightID!=INVALID_ID_16BIT) // has emissive
         ray._payload.accumulation += throughput*Light_getRadiance(lights[lightID]);
-
+#endif
     // check if we even have a BSDF at all
     uint bsdfID = bitfieldExtract(bsdfLightIDs,0,16);
     if (bsdfID!=INVALID_ID_16BIT)
@@ -130,7 +128,6 @@ bool closestHitProgram(in uint depth, in uint _sample, inout Ray_t ray, inout nb
 
     
 
-        float maxT = FLT_MAX;
         nbl_glsl_AnisotropicMicrofacetCache _cache;
 
         // do I need this?
@@ -156,12 +153,11 @@ bool closestHitProgram(in uint depth, in uint _sample, inout Ray_t ray, inout nb
                     
             // trace new ray
             ray._immutable.origin = intersection+bsdfSampleL*(1.0/*kSceneSize*/)*getStartTolerance(depth);
-            ray._immutable.maxT = maxT;
             ray._immutable.direction = bsdfSampleL;
-            return false;
+            return true;
         }
     }
-    return true;
+    return false;
 }
 #if 0
 bool closestHitProgram(in uint depth, in uint _sample, inout Ray_t ray, inout nbl_glsl_xoroshiro64star_state_t scramble_state)