precompute values in linear, bilinear sampling; make box muller a struct

keptsecret · keptsecret · commit 31342543116f · 2025-11-18T17:11:12.000+07:00
diff --git a/include/nbl/builtin/hlsl/sampling/bilinear.hlsl b/include/nbl/builtin/hlsl/sampling/bilinear.hlsl
@@ -28,13 +28,13 @@ struct Bilinear
     {
         Bilinear<T> retval;
         retval.bilinearCoeffs = bilinearCoeffs;
+        retval.twiceAreasUnderXCurve = vector2_type(bilinearCoeffs[0] + bilinearCoeffs[1], bilinearCoeffs[2] + bilinearCoeffs[3]);
         return retval;
     }
 
     vector2_type generate(NBL_REF_ARG(scalar_type) rcpPdf, NBL_CONST_REF_ARG(vector2_type) _u)
     {
         vector2_type u = _u;
-        const vector2_type twiceAreasUnderXCurve = vector2_type(bilinearCoeffs[0] + bilinearCoeffs[1], bilinearCoeffs[2] + bilinearCoeffs[3]);
         Linear<scalar_type> lineary = Linear<scalar_type>::create(twiceAreasUnderXCurve);
         u.y = lineary.generate(u.y);
 
@@ -52,7 +52,10 @@ struct Bilinear
         return 4.0 * nbl::hlsl::mix(nbl::hlsl::mix(bilinearCoeffs[0], bilinearCoeffs[1], u.x), nbl::hlsl::mix(bilinearCoeffs[2], bilinearCoeffs[3], u.x), u.y) / (bilinearCoeffs[0] + bilinearCoeffs[1] + bilinearCoeffs[2] + bilinearCoeffs[3]);
     }
 
-    vector4_type bilinearCoeffs;
+    // unit square: x0y0    x1y0
+    //              x0y1    x1y1
+    vector4_type bilinearCoeffs;    // (x0y0, x1y0, x0y1, x1y1)
+    vector2_type twiceAreasUnderXCurve;
 };
 
 }
diff --git a/include/nbl/builtin/hlsl/sampling/box_muller_transform.hlsl b/include/nbl/builtin/hlsl/sampling/box_muller_transform.hlsl
@@ -2,8 +2,8 @@
 // This file is part of the "Nabla Engine".
 // For conditions of distribution and use, see copyright notice in nabla.h
 
-#ifndef _NBL_BUILTIN_HLSL_BOX_MULLER_TRANSFORM_INCLUDED_
-#define _NBL_BUILTIN_HLSL_BOX_MULLER_TRANSFORM_INCLUDED_
+#ifndef _NBL_BUILTIN_HLSL_SAMPLING_BOX_MULLER_TRANSFORM_INCLUDED_
+#define _NBL_BUILTIN_HLSL_SAMPLING_BOX_MULLER_TRANSFORM_INCLUDED_
 
 #include "nbl/builtin/hlsl/math/functions.hlsl"
 #include "nbl/builtin/hlsl/numbers.hlsl"
@@ -12,15 +12,26 @@ namespace nbl
 {
 namespace hlsl
 {
+namespace sampling
+{
 
-template<typename T>
-vector<T,2> boxMullerTransform(vector<T,2> xi, T stddev)
+template<typename T NBL_PRIMARY_REQUIRES(concepts::FloatingPointLikeScalar<T>)
+struct BoxMullerTransform
 {
-    T sinPhi, cosPhi;
-    math::sincos<T>(2.0 * numbers::pi<float> * xi.y - numbers::pi<float>, sinPhi, cosPhi);
-    return vector<T,2>(cosPhi, sinPhi) * nbl::hlsl::sqrt(-2.0 * nbl::hlsl::log(xi.x)) * stddev;
-}
+    using scalar_type = T;
+    using vector2_type = vector<T,2>;
+
+    vector2_type operator()(vector2_type xi)
+    {
+        scalar_type sinPhi, cosPhi;
+        math::sincos<scalar_type>(2.0 * numbers::pi<scalar_type> * xi.y - numbers::pi<scalar_type>, sinPhi, cosPhi);
+        return vector2_type(cosPhi, sinPhi) * nbl::hlsl::sqrt(-2.0 * nbl::hlsl::log(xi.x)) * stddev;
+    }
 
+    T stddev;
+};
+
+}
 }
 }
 
diff --git a/include/nbl/builtin/hlsl/sampling/linear.hlsl b/include/nbl/builtin/hlsl/sampling/linear.hlsl
@@ -21,21 +21,26 @@ struct Linear
     using scalar_type = T;
     using vector2_type = vector<T, 2>;
 
-    static Linear<T> create(NBL_CONST_REF_ARG(vector2_type) linearCoeffs)
+    static Linear<T> create(NBL_CONST_REF_ARG(vector2_type) linearCoeffs)   // start and end importance values (start, end)
     {
         Linear<T> retval;
-        retval.linearCoeffs = linearCoeffs;
+        retval.linearCoeffStart = linearCoeffs[0];
+        retval.rcpDiff = 1.0 / (linearCoeffs[0] - linearCoeffs[1]);
+        vector2_type squaredCoeffs = linearCoeffs * linearCoeffs;
+        retval.squaredCoeffStart = squaredCoeffs[0];
+        retval.squaredCoeffDiff = squaredCoeffs[1] - squaredCoeffs[0];
         return retval;
     }
 
     scalar_type generate(scalar_type u)
     {
-        const scalar_type rcpDiff = 1.0 / (linearCoeffs[0] - linearCoeffs[1]);
-        const vector2_type squaredCoeffs = linearCoeffs * linearCoeffs;
-        return nbl::hlsl::abs(rcpDiff) < numeric_limits<scalar_type>::max ? (linearCoeffs[0] - nbl::hlsl::sqrt(nbl::hlsl::mix(squaredCoeffs[0], squaredCoeffs[1], u))) * rcpDiff : u;
+        return hlsl::mix(u, (linearCoeffStart - hlsl::sqrt(squaredCoeffStart + u * squaredCoeffDiff)) * rcpDiff, hlsl::abs(rcpDiff) < numeric_limits<scalar_type>::max);
     }
 
-    vector2_type linearCoeffs;
+    scalar_type linearCoeffStart;  
+    scalar_type rcpDiff;
+    scalar_type squaredCoeffStart;
+    scalar_type squaredCoeffDiff;
 };
 
 }

Original file line number	Diff line number	Diff line change
`@@ -28,13 +28,13 @@ struct Bilinear`
`28`	`28`	`{`
`29`	`29`	`Bilinear<T> retval;`
`30`	`30`	`retval.bilinearCoeffs = bilinearCoeffs;`
	`31`	`+ retval.twiceAreasUnderXCurve = vector2_type(bilinearCoeffs[0] + bilinearCoeffs[1], bilinearCoeffs[2] + bilinearCoeffs[3]);`
`31`	`32`	`return retval;`
`32`	`33`	`}`
`33`	`34`
`34`	`35`	`vector2_type generate(NBL_REF_ARG(scalar_type) rcpPdf, NBL_CONST_REF_ARG(vector2_type) _u)`
`35`	`36`	`{`
`36`	`37`	`vector2_type u = _u;`
`37`		`- const vector2_type twiceAreasUnderXCurve = vector2_type(bilinearCoeffs[0] + bilinearCoeffs[1], bilinearCoeffs[2] + bilinearCoeffs[3]);`
`38`	`38`	`Linear<scalar_type> lineary = Linear<scalar_type>::create(twiceAreasUnderXCurve);`
`39`	`39`	`u.y = lineary.generate(u.y);`
`40`	`40`
`@@ -52,7 +52,10 @@ struct Bilinear`
`52`	`52`	`return 4.0 * nbl::hlsl::mix(nbl::hlsl::mix(bilinearCoeffs[0], bilinearCoeffs[1], u.x), nbl::hlsl::mix(bilinearCoeffs[2], bilinearCoeffs[3], u.x), u.y) / (bilinearCoeffs[0] + bilinearCoeffs[1] + bilinearCoeffs[2] + bilinearCoeffs[3]);`
`53`	`53`	`}`
`54`	`54`
`55`		`- vector4_type bilinearCoeffs;`
	`55`	`+ // unit square: x0y0 x1y0`
	`56`	`+ // x0y1 x1y1`
	`57`	`+ vector4_type bilinearCoeffs; // (x0y0, x1y0, x0y1, x1y1)`
	`58`	`+ vector2_type twiceAreasUnderXCurve;`
`56`	`59`	`};`
`57`	`60`
`58`	`61`	`}`
Original file line number	Diff line number	Diff line change
`@@ -21,21 +21,26 @@ struct Linear`
`21`	`21`	`using scalar_type = T;`
`22`	`22`	`using vector2_type = vector<T, 2>;`
`23`	`23`
`24`		`- static Linear<T> create(NBL_CONST_REF_ARG(vector2_type) linearCoeffs)`
	`24`	`+ static Linear<T> create(NBL_CONST_REF_ARG(vector2_type) linearCoeffs) // start and end importance values (start, end)`
`25`	`25`	`{`
`26`	`26`	`Linear<T> retval;`
`27`		`- retval.linearCoeffs = linearCoeffs;`
	`27`	`+ retval.linearCoeffStart = linearCoeffs[0];`
	`28`	`+ retval.rcpDiff = 1.0 / (linearCoeffs[0] - linearCoeffs[1]);`
	`29`	`+ vector2_type squaredCoeffs = linearCoeffs * linearCoeffs;`
	`30`	`+ retval.squaredCoeffStart = squaredCoeffs[0];`
	`31`	`+ retval.squaredCoeffDiff = squaredCoeffs[1] - squaredCoeffs[0];`
`28`	`32`	`return retval;`
`29`	`33`	`}`
`30`	`34`
`31`	`35`	`scalar_type generate(scalar_type u)`
`32`	`36`	`{`
`33`		`- const scalar_type rcpDiff = 1.0 / (linearCoeffs[0] - linearCoeffs[1]);`
`34`		`- const vector2_type squaredCoeffs = linearCoeffs * linearCoeffs;`
`35`		`- return nbl::hlsl::abs(rcpDiff) < numeric_limits<scalar_type>::max ? (linearCoeffs[0] - nbl::hlsl::sqrt(nbl::hlsl::mix(squaredCoeffs[0], squaredCoeffs[1], u))) * rcpDiff : u;`
	`37`	`+ return hlsl::mix(u, (linearCoeffStart - hlsl::sqrt(squaredCoeffStart + u * squaredCoeffDiff)) * rcpDiff, hlsl::abs(rcpDiff) < numeric_limits<scalar_type>::max);`
`36`	`38`	`}`
`37`	`39`
`38`		`- vector2_type linearCoeffs;`
	`40`	`+ scalar_type linearCoeffStart;`
	`41`	`+ scalar_type rcpDiff;`
	`42`	`+ scalar_type squaredCoeffStart;`
	`43`	`+ scalar_type squaredCoeffDiff;`
`39`	`44`	`};`
`40`	`45`
`41`	`46`	`}`