Add multiple scattering correction for dielectrics

pezcode · pezcode · commit 248ce2516e66 · 2020-10-22T03:14:09.000+02:00
diff --git a/src/Renderer/PBRShader.cpp b/src/Renderer/PBRShader.cpp
@@ -114,11 +114,10 @@ void PBRShader::generateAlbedoLUT()
             bgfx::blit(1, readbackTexture, 0, 0, albedoLUTTexture);
 
             char* mem = new char[w * h * 4];
-            bgfx::readTexture(readbackTexture, mem, 0);
+            uint64_t frame = bgfx::readTexture(readbackTexture, mem, 0);
 
-            // wait two frames for result to be available and write it to a file
-            bgfx::frame();
-            bgfx::frame();
+            // wait for result to be available and write it to a file
+            while(bgfx::frame() < frame) { }
 
             bx::FileWriter writer;
             if(writer.open(file, false, &err))
diff --git a/src/Renderer/Shaders/cs_multiple_scattering_lut.sc b/src/Renderer/Shaders/cs_multiple_scattering_lut.sc
@@ -6,6 +6,8 @@
 
 // compute shader to calculate a lookup table for multiple scattering correction
 
+// TODO fix black pixels at grazing angles (NaN?)
+
 // Turquin. 2018. Practical multiple scattering compensation for microfacet models.
 // https://blog.selfshadow.com/publications/turquin/ms_comp_final.pdf
 
@@ -16,8 +18,8 @@
 #define LUT_SIZE 32
 #define THREADS LUT_SIZE
 
-// number of samples for approximating the albedo integral
-#define NUM_SAMPLES 2048
+// number of samples for approximating the integral
+#define NUM_SAMPLES 1024
 
 // http://holger.dammertz.org/stuff/notes_HammersleyOnHemisphere.html
 vec2 hammersley_2d(uint i, uint N)
@@ -27,40 +29,38 @@ vec2 hammersley_2d(uint i, uint N)
     bits = ((bits & 0x33333333u) << 2u) | ((bits & 0xCCCCCCCCu) >> 2u);
     bits = ((bits & 0x0F0F0F0Fu) << 4u) | ((bits & 0xF0F0F0F0u) >> 4u);
     bits = ((bits & 0x00FF00FFu) << 8u) | ((bits & 0xFF00FF00u) >> 8u);
-    float ri = float(bits) * 2.3283064365386963e-10; // / uintBitsToFloat(0x100000000);
+    float ri = float(bits) * 2.3283064365386963e-10; // / (1.0 << 32)
     return vec2(float(i) / float(N), ri);
 }
 
-// map two random variables in [0;1] to a point on a hemisphere centered around N = y
+// map two random variables in [0;1] to a cosine-weighted direction on the hemisphere centered around N = y
 // http://holger.dammertz.org/stuff/notes_HammersleyOnHemisphere.html
-vec3 sampleHemisphere(vec2 Xi)
+vec3 sampleHemisphereCosine(vec2 Xi)
 {
     // turn Xi into spherical coordinates
     // azimuthal angle (360°)
     float phi = Xi.y * 2.0 * PI;
     // polar angle (90°)
     // 1-u to map the first sample (0) in the Hammersley sequence to 1=cos(0°)=up
-    float cosTheta = 1.0 - Xi.x;
+    float cosTheta = sqrt(1.0 - Xi.x);
     float sinTheta = sqrt(1.0 - cosTheta * cosTheta);
+
     // to cartesian coordinates, y is up
     return vec3(
         cos(phi) * sinTheta,
         cosTheta,
         sin(phi) * sinTheta);
 }
 
-// same thing, but importance sampled for the GGX NDF
-// return values is the half-way vector H
-vec3 importanceSampleGGX(vec2 Xi, float roughness)
+// importance sample the hemisphere for the GGX NDF instead
+// return value is the half-way vector H
+// a is perceptual roughness squared
+vec3 sampleGGX(vec2 Xi, float a)
 {
-    float a = roughness * roughness;
-
-    // Sample in spherical coordinates
     float phi = 2.0 * PI * Xi.y;
     float cosTheta = sqrt((1.0 - Xi.x) / (1.0 + (a * a - 1.0) * Xi.x));
     float sinTheta = sqrt(1.0 - cosTheta * cosTheta);
 
-    // to cartesian coordinates, y is up
     return vec3(
         cos(phi) * sinTheta,
         cosTheta,
@@ -69,84 +69,74 @@ vec3 importanceSampleGGX(vec2 Xi, float roughness)
 
 #define IMPORTANCE_SAMPLE_BRDF 1
 
-// calculate the albedo for a perfectly reflective surface (F0 = 1)
-// = the irradiance reflected towards the eye position from uniform
-// lighting over the hemisphere
-float albedo(float NoV, float roughness)
+// calculate the directional albedo = the irradiance reflected towards the eye position
+// from uniform lighting over the hemisphere
+float albedo_specular(vec3 V, float NoV, PBRMaterial mat)
 {
-	vec3 V;
-    V.x = sqrt(1.0 - NoV * NoV); // sin
-    V.y = NoV; // cos
-    V.z = 0.0;
-
     // N points straight upwards (y) for this integration
     const vec3 N = vec3(0.0, 1.0, 0.0);
 
     float E = 0.0;
 
-    // fixed F0 -> perfectly reflective surface
-    // only valid for metals, for dielectrics this needs to be a 3D LUT with F0 as a parameter
-    // we could possibly fix F0 at 0.04 like GLTF does, and write a second channel in the LUT
-    // how does this work with lerping with the metallic factor?
-    const vec3 F0 = vec3_splat(1.0);
+    // Monte-Carlo sampling for numerically integrating the directional albedo
+    // E(V) = integral(brdf(V,L) * dot(N,L))
 
-    // Monte-Carlo sampling for numerically integrating the albedo over the hemisphere
-    // a(V) = integral(brdf(V, L) * dot(N,L))
     for(uint i = 0; i < NUM_SAMPLES; i++)
     {
         // quasirandom values in [0;1]
         // is there a better distribution we can use?
         // see http://extremelearning.com.au/unreasonable-effectiveness-of-quasirandom-sequences/
         vec2 Xi = hammersley_2d(i, NUM_SAMPLES);
 
-        #if IMPORTANCE_SAMPLE_BRDF
-
         // sample microfacet direction
         // this returns H because we sample the NDF, which is the distribution of microfacets, which reflect around H
-        // apparently the PDF needs the 4*VoH denominator (related to the Jacobian)
-        // clarify!
-        vec3 H = importanceSampleGGX(Xi, roughness);
+        // because we sample H but integrate over L, the PDF needs the 4*VoH denominator (the Jacobian of the H -> L change of variables)
+        vec3 H = sampleGGX(Xi, mat.a);
 
         // get the light direction
         vec3 L = 2.0 * dot(V, H) * H - V;
 
-        #else
-
-        vec3 L = sampleHemisphere(Xi);
-        vec3 H = normalize(V + L);
-
-        #endif
-
         float NoL = saturate(dot(N, L));
         float NoH = saturate(dot(N, H));
         float VoH = saturate(dot(V, H));
 
-        // specular BRDF
-
-        float a = roughness * roughness;
-        
-        float F = F_Schlick(VoH, F0).x;
-        float VF = V_SmithGGXCorrelated(NoV, NoL, a);
-        float D = D_GGX(NoH, a);
+        // evaluate BRDF
 
-        #if IMPORTANCE_SAMPLE_BRDF
+        float F = F_Schlick(VoH, mat.F0).x;
+        float VF = V_SmithGGXCorrelated(NoV, NoL, mat.a);
+        float D = D_GGX(NoH, mat.a);
 
         //float Fr = F * VF * D;
-        //float pdf = D * NoH / (4.0 * VoH);
-        //E += Fr * NoL / pdf;
+        //float inv_pdf = (4.0 * VoH) / (D * NoH);
+        //E += Fr * NoL * inv_pdf;
         // -> D cancels out
 
-        E += F * VF * NoL * (4.0 * VoH) / NoH;
+        E += F * VF * NoL * 4.0 * VoH / NoH;
+    }
 
-        #else
+    return E / float(NUM_SAMPLES);
+}
 
-        // this kind of converges at massive sample rates (1 million +)
-        // but for low angles and high roughness the output is off
-        // investigate!
-        float pdf = 0.5 * INV_PI;
-        E += F * VF * D * NoL / pdf;
+float albedo_diffuse(vec3 V, float NoV, PBRMaterial mat)
+{
+    float E = 0.0;
+
+    for(uint i = 0; i < NUM_SAMPLES; i++)
+    {
+        vec2 Xi = hammersley_2d(i, NUM_SAMPLES);
+
+        vec3 L = sampleHemisphereCosine(Xi);
+        vec3 H = normalize(V + L);
+
+        float VoH = saturate(dot(V, H));
 
-        #endif
+        float F = F_Schlick(VoH, mat.F0).x;
+
+        // Fr = (1 - F) * C * (1/pi) * NoL
+        // float inv_pdf = pi/NoL
+        // -> 1/pi and NoL cancel out
+
+        E += (1.0 - F) * mat.diffuseColor.x;
     }
 
     return E / float(NUM_SAMPLES);
@@ -160,9 +150,27 @@ void main()
 
     float NoV = values.x;
     float roughness = values.y;
-    float result = albedo(NoV, roughness);
 
-    result = saturate(result);
+    vec3 V;
+    V.x = sqrt(1.0 - NoV * NoV); // sin
+    V.y = NoV; // cos
+    V.z = 0.0;
+
+    PBRMaterial mat;
+    // D3D compiler insists we initialize everything
+    mat.normal = vec3(0.0, 1.0, 0.0);
+    mat.occlusion = 0.0;
+    mat.emissive = vec3_splat(0.0);
+    mat.albedo = vec4_splat(1.0);
+    mat.roughness = roughness;
+
+    mat.metallic = 1.0; // F0 = albedo -> perfectly reflective surface
+    mat = pbrInitMaterial(mat);
+    float albedo_metal = albedo_specular(V, NoV, mat);
+
+    mat.metallic = 0.0; // F0 = 0.04
+    mat = pbrInitMaterial(mat);
+    float albedo_dielectric = albedo_specular(V, NoV, mat) + albedo_diffuse(V, NoV, mat);
 
-    imageStore(i_texAlbedoLUT, coords, vec4(result, result, result, 1.0));
+    imageStore(i_texAlbedoLUT, coords, vec4(albedo_metal, albedo_dielectric, 0.0, 1.0));
 }
diff --git a/src/Renderer/Shaders/pbr.sh b/src/Renderer/Shaders/pbr.sh
@@ -161,6 +161,8 @@ PBRMaterial pbrInitMaterial(PBRMaterial mat)
     mat.F0 = mix(dielectricSpecular, mat.albedo.rgb, mat.metallic);
     // perceptual roughness to roughness
     mat.a = mat.roughness * mat.roughness;
+    // prevent division by 0
+    mat.a = max(mat.a, 0.01);
 
     return mat;
 }
@@ -185,11 +187,7 @@ float specularAntiAliasing(vec3 N, float a)
     vec3 dndv = dFdy(N);
     float variance = SIGMA2 * (dot(dndu, dndu) + dot(dndv, dndv));
     float kernelRoughness2 = min(2.0 * variance, KAPPA);
-    float filteredRoughness2 = saturate(a + kernelRoughness2);
-    a = filteredRoughness2;
-
-    // Frostbite clamps roughness to 0.045 (0.045^2 = 0.002025)
-    return max(a, 0.002025);
+    return saturate(a + kernelRoughness2);
 }
 
 #endif
@@ -266,20 +264,20 @@ float Fd_Lambert()
 // https://blog.selfshadow.com/publications/turquin/ms_comp_final.pdf
 vec3 multipleScatteringFactor(PBRMaterial mat, float NoV)
 {
-    // E is the albedo for single scattering, ie. the total reflectance for a viewing direction
-    float E = texture2D(s_texAlbedoLUT, vec2(NoV, mat.a)).x;
-    vec3 factor = vec3_splat(1.0) + mat.F0 * (1.0/E - 1.0);
-
-    // TODO implement for dielectrics
-    // requires an extra dimension in the LUT texture
+    // Turquin approximates the multiple scattering portion of the BRDF using a scaled down version of the single scattering BRDF
+    // That scale factor is derived from E: the directional albedo for single scattering, ie. the total reflectance for a viewing direction
+    vec2 E = texture2D(s_texAlbedoLUT, vec2(NoV, mat.a)).xy;
 
-    // for metals, the albedo value is calculated with F = 1
+    // for metals, the albedo value is calculated with F = 1 (perfect reflection)
     // fresnel determines whether light is reflected or absorbed
+    vec3 factorMetallic = vec3_splat(1.0) + mat.F0 * (1.0 / E.x - 1.0);
 
-    // for dielectrics, fresnel determines the ratio between two different albedos
+    // for dielectrics, fresnel determines the ratio between specular and diffuse energy
     // so the albedo depends on F as a variable
+    // however, dielectrics in GLTF have a fixed F0 of 0.04 so we can do this with a second channel in the LUT
+    vec3 factorDielectric = vec3_splat(1.0 / E.y);
 
-    return mix(vec3_splat(1.0), factor, mat.metallic);
+    return mix(factorDielectric, factorMetallic, mat.metallic);
 }
 
 #endif