diff --git a/LICENSE.txt b/LICENSE.txt
index f20b91b..4416f93 100644
--- a/LICENSE.txt
+++ b/LICENSE.txt
@@ -1,4 +1,4 @@
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/README.md b/README.md
index 2f4c7fb..d42ed36 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
 # FidelityFX Denoiser
 
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
 in the Software without restriction, including without limitation the rights
@@ -19,13 +19,24 @@ THE SOFTWARE.
 
 ## Overview
 
-FidelityFX Denoiser will contain a collection of highly optimized denoiser implementations for specific use cases.
+FidelityFX Denoiser contains a collection of highly optimized denoiser implementations for specific use cases.
 
-## FFX Reflection Denoiser
+## FidelityFX Shadow Denoiser
 
-The reflection denoiser includes a high performant Spatio-temporal denoiser specialized for reflection denoising.
+A spatio-temporal denoiser for raytraced soft shadows. It is intended to be used on a shadow mask that was created from at most one jittered shadow ray per pixel.
+It makes use of a tile classification pass to skip work on areas without spatial variance in the shadow mask.
+In cases of low temporal sample counts, the contribution from the spatial filters is increased; it then gradually cools off as the temporal sample count increases.
+The denoiser aims to avoid ghosting artifacts by analyzing the local pixel neighborhood and clamping the accumulated history.
+
+### Links
+
+- ffx-shadows-dnsr contains the [Shadow Denoiser](https://github.com/GPUOpen-Effects/FidelityFX-Denoiser/tree/master/ffx-shadows-dnsr)
+
+## FidelityFX Reflection Denoiser
+
+The reflection denoiser includes a high-performance spatio-temporal denoiser specialized for reflection denoising.
 The preferred use case of this denoiser is within applications requiring denoised radiance values generated by some stochastic reflection implementation.
-Example of stochastic reflections:
+Examples of stochastic reflections:
 - Stochastic Screen Space Reflections
 - Stochastic Raytraced Reflections
 
@@ -34,5 +45,3 @@ Example of stochastic reflections:
 - ffx-reflection-dnsr contains the [Reflection Denoiser](https://github.com/GPUOpen-Effects/FidelityFX-Denoiser/tree/master/ffx-reflection-dnsr)
 - Visit [FidelityFX SSSR](https://github.com/GPUOpen-Effects/FidelityFX-SSSR/tree/master/sample) to see the reflection denoiser in action.
 
-## FFX Shadow Denoiser (Future Update)
-A denoiser optimized for raytraced shadows will be added here in a future update. If you are a developer working on a raytracing title then please contact your AMD representative for early access.
\ No newline at end of file
diff --git a/docs/FFX_Denoiser_Reflection_Technology.pdf b/docs/FFX_Denoiser_Reflection_Technology.pdf
index dbd37c0..30e85a6 100644
Binary files a/docs/FFX_Denoiser_Reflection_Technology.pdf and b/docs/FFX_Denoiser_Reflection_Technology.pdf differ
diff --git a/docs/FFX_Denoiser_Shadows_Technology.pdf b/docs/FFX_Denoiser_Shadows_Technology.pdf
new file mode 100644
index 0000000..051e6ad
Binary files /dev/null and b/docs/FFX_Denoiser_Shadows_Technology.pdf differ
diff --git a/ffx-reflection-dnsr/ffx_denoiser_reflections_blur.h b/ffx-reflection-dnsr/ffx_denoiser_reflections_blur.h
index b0a08d0..046862a 100644
--- a/ffx-reflection-dnsr/ffx_denoiser_reflections_blur.h
+++ b/ffx-reflection-dnsr/ffx_denoiser_reflections_blur.h
@@ -1,5 +1,5 @@
 /**********************************************************************
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/ffx-reflection-dnsr/ffx_denoiser_reflections_classify_tiles.h b/ffx-reflection-dnsr/ffx_denoiser_reflections_classify_tiles.h
index b448684..c3abff9 100644
--- a/ffx-reflection-dnsr/ffx_denoiser_reflections_classify_tiles.h
+++ b/ffx-reflection-dnsr/ffx_denoiser_reflections_classify_tiles.h
@@ -1,5 +1,5 @@
 /**********************************************************************
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/ffx-reflection-dnsr/ffx_denoiser_reflections_common.h b/ffx-reflection-dnsr/ffx_denoiser_reflections_common.h
index 32ee0e2..1ffd5ea 100644
--- a/ffx-reflection-dnsr/ffx_denoiser_reflections_common.h
+++ b/ffx-reflection-dnsr/ffx_denoiser_reflections_common.h
@@ -1,5 +1,5 @@
 /**********************************************************************
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_spatial.h b/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_spatial.h
index 0b422af..956c6e5 100644
--- a/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_spatial.h
+++ b/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_spatial.h
@@ -1,5 +1,5 @@
 /**********************************************************************
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_temporal.h b/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_temporal.h
index 11cb415..430b4d0 100644
--- a/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_temporal.h
+++ b/ffx-reflection-dnsr/ffx_denoiser_reflections_resolve_temporal.h
@@ -1,5 +1,5 @@
 /**********************************************************************
-Copyright (c) 2020 Advanced Micro Devices, Inc. All rights reserved.
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
 
 Permission is hereby granted, free of charge, to any person obtaining a copy
 of this software and associated documentation files (the "Software"), to deal
diff --git a/ffx-shadows-dnsr/ffx_denoiser_shadows_filter.h b/ffx-shadows-dnsr/ffx_denoiser_shadows_filter.h
new file mode 100644
index 0000000..d29d07b
--- /dev/null
+++ b/ffx-shadows-dnsr/ffx_denoiser_shadows_filter.h
@@ -0,0 +1,273 @@
+/**********************************************************************
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+********************************************************************/
+
+#ifndef FFX_DNSR_SHADOWS_FILTER_HLSL
+#define FFX_DNSR_SHADOWS_FILTER_HLSL
+
+#include "ffx_denoiser_shadows_util.h"
+
+groupshared uint g_FFX_DNSR_Shadows_shared_input[16][16];      // input pair packed as two halves, indexed [y][x]
+groupshared float g_FFX_DNSR_Shadows_shared_depth[16][16];     // depth stored as a full float, indexed [y][x]
+groupshared uint g_FFX_DNSR_Shadows_shared_normals_xy[16][16]; // normal.xy packed as two halves
+groupshared uint g_FFX_DNSR_Shadows_shared_normals_zw[16][16]; // normal.z in the low half; the high half is written as 0
+
+uint FFX_DNSR_Shadows_PackFloat16(float16_t2 v) // Packs v.x into bits 0-15 and v.y into bits 16-31 of one uint.
+{
+    const uint2 half_bits = f32tof16(float2(v));
+    return (half_bits.y << 16) | half_bits.x;
+}
+
+float16_t2 FFX_DNSR_Shadows_UnpackFloat16(uint a) // Low 16 bits become x, high 16 bits become y.
+{
+    const uint low_half = a & 0xFFFF;
+    const uint high_half = a >> 16;
+    return float16_t2(f16tof32(uint2(low_half, high_half)));
+}
+
+float16_t2 FFX_DNSR_Shadows_LoadInputFromGroupSharedMemory(int2 idx) // Unpacks the cached input pair stored at [idx.y][idx.x].
+{
+    return FFX_DNSR_Shadows_UnpackFloat16(g_FFX_DNSR_Shadows_shared_input[idx.y][idx.x]);
+}
+
+float FFX_DNSR_Shadows_LoadDepthFromGroupSharedMemory(int2 idx) // Returns the cached depth stored at [idx.y][idx.x].
+{
+    return g_FFX_DNSR_Shadows_shared_depth[idx.y][idx.x];
+}
+
+float16_t3 FFX_DNSR_Shadows_LoadNormalsFromGroupSharedMemory(int2 idx)
+{
+    // xy comes from one packed word; z is the low half of the second word (its high half is ignored).
+    const float16_t2 unpacked_xy = FFX_DNSR_Shadows_UnpackFloat16(g_FFX_DNSR_Shadows_shared_normals_xy[idx.y][idx.x]);
+    const float16_t2 unpacked_zw = FFX_DNSR_Shadows_UnpackFloat16(g_FFX_DNSR_Shadows_shared_normals_zw[idx.y][idx.x]);
+    return float16_t3(unpacked_xy, unpacked_zw.x);
+}
+
+void FFX_DNSR_Shadows_StoreInGroupSharedMemory(int2 idx, float16_t3 normals, float16_t2 input, float depth)
+{
+    g_FFX_DNSR_Shadows_shared_depth[idx.y][idx.x] = depth; // depth stays a full float
+    g_FFX_DNSR_Shadows_shared_input[idx.y][idx.x] = FFX_DNSR_Shadows_PackFloat16(input);
+    g_FFX_DNSR_Shadows_shared_normals_zw[idx.y][idx.x] = FFX_DNSR_Shadows_PackFloat16(float16_t2(normals.z, 0)); // z plus zero padding
+    g_FFX_DNSR_Shadows_shared_normals_xy[idx.y][idx.x] = FFX_DNSR_Shadows_PackFloat16(normals.xy);
+}
+
+void FFX_DNSR_Shadows_LoadWithOffset(int2 did, int2 offset, out float16_t3 normals, out float16_t2 input, out float depth)
+{
+    // Shift the coordinate, then clamp it to [0, buffer dimensions - 1] before reading.
+    const int2 texel = clamp(did + offset, int2(0, 0), FFX_DNSR_Shadows_GetBufferDimensions() - 1);
+
+    normals = FFX_DNSR_Shadows_ReadNormals(texel);
+    input = FFX_DNSR_Shadows_ReadInput(texel);
+    depth = FFX_DNSR_Shadows_ReadDepth(texel);
+}
+
+void FFX_DNSR_Shadows_StoreWithOffset(int2 gtid, int2 offset, float16_t3 normals, float16_t2 input, float depth)
+{
+    // Writes the sample into the groupshared slot at gtid shifted by offset.
+    FFX_DNSR_Shadows_StoreInGroupSharedMemory(gtid + offset, normals, input, depth);
+}
+
+void FFX_DNSR_Shadows_InitializeGroupSharedMemory(int2 did, int2 gtid)
+{
+    // Every thread fetches four texels and writes them to the matching slots of the 16x16
+    // groupshared tile, one per quadrant (presumably gtid spans 0..7 in both axes):
+    ///   X A
+    ///   B C
+    const int2 quadrant_x = int2(0, 0);
+    const int2 quadrant_a = int2(8, 0);
+    const int2 quadrant_b = int2(0, 8);
+    const int2 quadrant_c = int2(8, 8);
+    const int2 first_texel = did - 4; // texel this thread loads for quadrant X
+
+    float16_t3 normals_x;
+    float16_t3 normals_a;
+    float16_t3 normals_b;
+    float16_t3 normals_c;
+
+    float16_t2 input_x;
+    float16_t2 input_a;
+    float16_t2 input_b;
+    float16_t2 input_c;
+
+    float depth_x;
+    float depth_a;
+    float depth_b;
+    float depth_c;
+
+    FFX_DNSR_Shadows_LoadWithOffset(first_texel, quadrant_x, normals_x, input_x, depth_x);
+    FFX_DNSR_Shadows_LoadWithOffset(first_texel, quadrant_a, normals_a, input_a, depth_a);
+    FFX_DNSR_Shadows_LoadWithOffset(first_texel, quadrant_b, normals_b, input_b, depth_b);
+    FFX_DNSR_Shadows_LoadWithOffset(first_texel, quadrant_c, normals_c, input_c, depth_c);
+
+    FFX_DNSR_Shadows_StoreWithOffset(gtid, quadrant_x, normals_x, input_x, depth_x);
+    FFX_DNSR_Shadows_StoreWithOffset(gtid, quadrant_a, normals_a, input_a, depth_a);
+    FFX_DNSR_Shadows_StoreWithOffset(gtid, quadrant_b, normals_b, input_b, depth_b);
+    FFX_DNSR_Shadows_StoreWithOffset(gtid, quadrant_c, normals_c, input_c, depth_c);
+}
+
+float FFX_DNSR_Shadows_GetShadowSimilarity(float x1, float x2, float sigma) // exp(-|x1 - x2| / sigma): 1 for equal values, decaying as they diverge; sigma is not checked for 0.
+{
+    return exp(-abs(x1 - x2) / sigma);
+}
+
+float FFX_DNSR_Shadows_GetDepthSimilarity(float x1, float x2, float sigma) // exp(-|x1 - x2| / sigma): 1 for equal depths, decaying as they diverge; sigma is not checked for 0.
+{
+    return exp(-abs(x1 - x2) / sigma);
+}
+
+float FFX_DNSR_Shadows_GetNormalSimilarity(float3 x1, float3 x2) // saturate(dot(x1, x2)) raised to the 32nd power; 0 whenever the dot product is not positive.
+{
+    return pow(saturate(dot(x1, x2)), 32.0f);
+}
+
+float FFX_DNSR_Shadows_GetLinearDepth(uint2 did, float depth)
+{
+    // Pixel center -> uv -> NDC (y flipped), then apply the inverse projection and return |z / w|.
+    const float2 pixel_uv = (did + 0.5f) * FFX_DNSR_Shadows_GetInvBufferDimensions();
+    const float2 ndc_xy = 2.0f * float2(pixel_uv.x, 1.0f - pixel_uv.y) - 1.0f;
+    const float4 unprojected = mul(FFX_DNSR_Shadows_GetProjectionInverse(), float4(ndc_xy, depth, 1));
+    return abs(unprojected.z / unprojected.w);
+}
+
+float FFX_DNSR_Shadows_FetchFilteredVarianceFromGroupSharedMemory(int2 pos)
+{
+    // 3x3 weighted sum of the .y component of the cached input around pos.
+    // Weights depend only on |offset|: center 1/4, edge neighbors 1/8, corners 1/16.
+    const float weights[2][2] = { { 1.0f / 4.0f, 1.0f / 8.0f }, { 1.0f / 8.0f, 1.0f / 16.0f } };
+    const int radius = 1;
+    float filtered = 0.0f;
+
+    for (int dy = -radius; dy <= radius; ++dy)
+    {
+        for (int dx = -radius; dx <= radius; ++dx)
+        {
+            const float16_t2 tap = FFX_DNSR_Shadows_LoadInputFromGroupSharedMemory(pos + int2(dx, dy));
+            filtered += weights[abs(dx)][abs(dy)] * tap.y;
+        }
+    }
+
+    return filtered;
+}
+
+void FFX_DNSR_Shadows_DenoiseFromGroupSharedMemory(uint2 did, uint2 gtid, inout float weight_sum, inout float2 shadow_sum, float depth, uint stepsize)
+{
+    // Edge-aware 3x3 filter (taps spaced by stepsize) around gtid; start by loading the center sample
+    const float2 shadow_center = FFX_DNSR_Shadows_LoadInputFromGroupSharedMemory(gtid);
+    const float3 normal_center = FFX_DNSR_Shadows_LoadNormalsFromGroupSharedMemory(gtid);
+
+    weight_sum = 1.0f;          // the center sample counts with weight 1 ...
+    shadow_sum = shadow_center; // ... so both sums overwrite whatever the caller passed in
+
+    const float variance = FFX_DNSR_Shadows_FetchFilteredVarianceFromGroupSharedMemory(gtid);
+    const float std_deviation = sqrt(max(variance + 1e-9f, 0.0f)); // the epsilon avoids a zero sigma when variance is 0
+    const float depth_center = FFX_DNSR_Shadows_GetLinearDepth(did, depth);    // linearize the depth value
+
+    // Iterate filter kernel
+    const int k = 1;
+    const float kernel[3] = { 1.0f, 2.0f / 3.0f, 1.0f / 6.0f }; // with k = 1 only entries 0 and 1 are read
+
+    for (int y = -k; y <= k; ++y)
+    {
+        for (int x = -k; x <= k; ++x)
+        {
+            // Position of this tap in groupshared memory (gtid_idx) and on screen (did_idx)
+            const int2 step = int2(x, y) * stepsize;
+            const int2 gtid_idx = gtid + step;
+            const int2 did_idx = did + step;
+
+            float depth_neigh = FFX_DNSR_Shadows_LoadDepthFromGroupSharedMemory(gtid_idx);
+            float3 normal_neigh = FFX_DNSR_Shadows_LoadNormalsFromGroupSharedMemory(gtid_idx);
+            float2 shadow_neigh = FFX_DNSR_Shadows_LoadInputFromGroupSharedMemory(gtid_idx);
+
+            float sky_pixel_multiplier = ((x == 0 && y == 0) || depth_neigh >= 1.0f || depth_neigh <= 0.0f) ? 0 : 1; // Zero weight for sky pixels and for the center tap (already accumulated above)
+
+            // Fetch our filtering values
+            depth_neigh = FFX_DNSR_Shadows_GetLinearDepth(did_idx, depth_neigh);
+
+            // Evaluate the edge-stopping function
+            float w = kernel[abs(x)] * kernel[abs(y)];  // kernel weight
+            w *= FFX_DNSR_Shadows_GetShadowSimilarity(shadow_center.x, shadow_neigh.x, std_deviation);
+            w *= FFX_DNSR_Shadows_GetDepthSimilarity(depth_center, depth_neigh, FFX_DNSR_Shadows_GetDepthSimilaritySigma());
+            w *= FFX_DNSR_Shadows_GetNormalSimilarity(normal_center, normal_neigh);
+            w *= sky_pixel_multiplier;
+
+            // Accumulate the filtered sample (x is weighted by w, y by w squared)
+            shadow_sum += float2(w, w * w) * shadow_neigh;
+            weight_sum += w;
+        }
+    }
+}
+
+float2 FFX_DNSR_Shadows_ApplyFilterWithPrecache(uint2 did, uint2 gtid, uint stepsize)
+{
+    // All threads fill groupshared memory and reach the barrier, even those whose pixel is skipped below.
+    FFX_DNSR_Shadows_InitializeGroupSharedMemory(did, gtid);
+    const bool is_receiver = FFX_DNSR_Shadows_IsShadowReciever(did);
+    GroupMemoryBarrierWithGroupSync();
+
+    float total_weight = 1.0;
+    float2 accumulated = 0.0;
+    if (is_receiver)
+    {
+        // The +4 shift centers the thread inside the groupshared tile.
+        const uint2 centered_gtid = gtid + 4;
+        FFX_DNSR_Shadows_DenoiseFromGroupSharedMemory(did, centered_gtid, total_weight, accumulated, FFX_DNSR_Shadows_ReadDepth(did), stepsize);
+    }
+
+    // x: sum divided by the weight sum (mean); y: sum divided by the squared weight sum (variance).
+    return float2(accumulated.x / total_weight, accumulated.y / (total_weight * total_weight));
+}
+
+void FFX_DNSR_Shadows_ReadTileMetaData(uint2 gid, out bool is_cleared, out bool all_in_light)
+{
+    const uint tile_flags = FFX_DNSR_Shadows_ReadTileMetaData(gid.y * FFX_DNSR_Shadows_RoundedDivide(FFX_DNSR_Shadows_GetBufferDimensions().x, 8) + gid.x); // one flag word per tile, stored row by row
+    all_in_light = (tile_flags & TILE_META_DATA_LIGHT_MASK) != 0;
+    is_cleared = (tile_flags & TILE_META_DATA_CLEAR_MASK) != 0;
+}
+
+
+float2 FFX_DNSR_Shadows_FilterSoftShadowsPass(uint2 gid, uint2 gtid, uint2 did, out bool bWriteResults, uint const pass, uint const stepsize)
+{
+    // Tiles flagged as cleared skip the filter and output a constant (1 if fully lit, else 0);
+    // every other tile runs the full groupshared filter.
+    bool tile_is_cleared;
+    bool tile_all_in_light;
+    FFX_DNSR_Shadows_ReadTileMetaData(gid, tile_is_cleared, tile_all_in_light);
+
+    // Filtered tiles always write; cleared tiles write in every pass except pass 1.
+    bWriteResults = !tile_is_cleared || (pass != 1);
+
+    float2 filtered = float2(0, 0);
+    [branch]
+    if (!tile_is_cleared)
+    {
+        filtered = FFX_DNSR_Shadows_ApplyFilterWithPrecache(did, gtid, stepsize);
+    }
+    else if (pass != 1)
+    {
+        // Only the mean is set; the variance component stays 0.
+        filtered.x = tile_all_in_light ? 1.0 : 0.0;
+    }
+
+    return filtered;
+}
+
+#endif
diff --git a/ffx-shadows-dnsr/ffx_denoiser_shadows_prepare.h b/ffx-shadows-dnsr/ffx_denoiser_shadows_prepare.h
new file mode 100644
index 0000000..ea853fa
--- /dev/null
+++ b/ffx-shadows-dnsr/ffx_denoiser_shadows_prepare.h
@@ -0,0 +1,53 @@
+/**********************************************************************
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+********************************************************************/
+
+#ifndef FFX_DNSR_SHADOWS_PREPARESHADOWMASK_HLSL
+#define FFX_DNSR_SHADOWS_PREPARESHADOWMASK_HLSL
+
+#include "ffx_denoiser_shadows_util.h"
+
+void FFX_DNSR_Shadows_CopyResult(uint2 gtid, uint2 gid)
+{
+    // Lanes whose pixel hits the light contribute their pixel's bit mask; the wave-wide OR forms the 8x4 tile's mask word.
+    const uint2 pixel = gid * uint2(8, 4) + gtid;
+    const uint lane_bits = FFX_DNSR_Shadows_HitsLight(pixel, gtid, gid) ? FFX_DNSR_Shadows_GetBitMaskFromPixelPosition(pixel) : 0;
+    const uint tile_mask = WaveActiveBitOr(lane_bits);
+    FFX_DNSR_Shadows_WriteMask(FFX_DNSR_Shadows_LinearTileIndex(gid, FFX_DNSR_Shadows_GetBufferDimensions().x), tile_mask);
+}
+ 
+void FFX_DNSR_Shadows_PrepareShadowMask(uint2 gtid, uint2 gid)
+{
+    // Each group walks a 4x4 block of 8x4-pixel tiles; tile ids past the edge are clamped onto the last valid tile.
+    const uint2 first_tile = gid * 4;
+    const uint2 last_tile = (FFX_DNSR_Shadows_GetBufferDimensions() + uint2(7, 3)) / uint2(8, 4) - 1;
+
+    for (int tx = 0; tx < 4; ++tx)
+    {
+        for (int ty = 0; ty < 4; ++ty)
+        {
+            const uint2 tile = clamp(uint2(first_tile.x + tx, first_tile.y + ty), 0, last_tile);
+            FFX_DNSR_Shadows_CopyResult(gtid, tile);
+        }
+    }
+}
+
+#endif
diff --git a/ffx-shadows-dnsr/ffx_denoiser_shadows_tileclassification.h b/ffx-shadows-dnsr/ffx_denoiser_shadows_tileclassification.h
new file mode 100644
index 0000000..9c3cc37
--- /dev/null
+++ b/ffx-shadows-dnsr/ffx_denoiser_shadows_tileclassification.h
@@ -0,0 +1,425 @@
+/**********************************************************************
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+********************************************************************/
+
+#ifndef FFX_DNSR_SHADOWS_TILECLASSIFICATION_HLSL
+#define FFX_DNSR_SHADOWS_TILECLASSIFICATION_HLSL
+
+#include "ffx_denoiser_shadows_util.h"
+
+groupshared int g_FFX_DNSR_Shadows_false_count; // set to 1 by any thread whose value is false
+bool FFX_DNSR_Shadows_ThreadGroupAllTrue(bool val) // Returns true only if val is true on every thread of the group.
+{
+    const uint lane_count_in_thread_group = 64;
+    if (WaveGetLaneCount() == lane_count_in_thread_group)
+    {
+        return WaveActiveAllTrue(val); // wave size matches the assumed 64-thread group, so a wave vote is enough
+    }
+    else
+    {
+        GroupMemoryBarrierWithGroupSync(); // presumably protects readers of the flag from an earlier call
+        g_FFX_DNSR_Shadows_false_count = 0;
+        GroupMemoryBarrierWithGroupSync(); // the reset must land before any thread raises the flag
+        if (!val) g_FFX_DNSR_Shadows_false_count = 1;
+        GroupMemoryBarrierWithGroupSync(); // all flags are written before anyone reads the result
+        return g_FFX_DNSR_Shadows_false_count == 0;
+    }
+}
+
+void FFX_DNSR_Shadows_SearchSpatialRegion(uint2 gid, out bool all_in_light, out bool all_in_shadow)
+{
+    // Together the spatial passes can reach a region of 1+2+4 = 7 pixels around each block,
+    // so the masks surrounding the block are inspected as well. Masks are 8x4 pixels,
+    // which is why the vertical extent of the scan is larger than the horizontal one.
+    //
+    // Each x below is a 4x4 block and each pair is one 8x4 mask as written by the raytracer;
+    // yy marks the masks of the block that is being classified:
+    //
+    // xx xx xx
+    // xx xx xx
+    // xx yy xx <-- this yy row is first_tile below
+    // xx yy xx
+    // xx xx xx
+    // xx xx xx
+    //
+    // Nothing here depends on the thread index, so this should result in scalar ops.
+    const uint2 first_tile = FFX_DNSR_Shadows_GetTileIndexFromPixelPosition(gid * int2(8, 8));
+    const int2 last_valid_tile = int2(FFX_DNSR_Shadows_RoundedDivide(FFX_DNSR_Shadows_GetBufferDimensions().x, 8), FFX_DNSR_Shadows_RoundedDivide(FFX_DNSR_Shadows_GetBufferDimensions().y, 4)) - 1;
+
+    // Fold every mask of the region into a running OR and a running AND.
+    uint any_lit = 0;
+    uint all_lit = 0xFFFFFFFF;
+    for (int row = -2; row <= 3; ++row)
+    {
+        for (int col = -1; col <= 1; ++col)
+        {
+            const int2 tile = clamp(int2(first_tile + int2(col, row)), 0, last_valid_tile);
+            const uint mask = FFX_DNSR_Shadows_ReadRaytracedShadowMask(FFX_DNSR_Shadows_LinearTileIndex(tile, FFX_DNSR_Shadows_GetBufferDimensions().x));
+
+            any_lit |= mask;
+            all_lit &= mask;
+        }
+    }
+
+    all_in_shadow = any_lit == 0u;
+    all_in_light = all_lit == 0xFFFFFFFFu;
+}
+
+float FFX_DNSR_Shadows_GetLinearDepth(uint2 did, float depth)
+{
+    // Pixel center -> uv -> NDC (y flipped), then apply the inverse projection and return |z / w|.
+    const float2 pixel_uv = (did + 0.5f) * FFX_DNSR_Shadows_GetInvBufferDimensions();
+    const float2 ndc_xy = 2.0f * float2(pixel_uv.x, 1.0f - pixel_uv.y) - 1.0f;
+    const float4 unprojected = mul(FFX_DNSR_Shadows_GetProjectionInverse(), float4(ndc_xy, depth, 1));
+    return abs(unprojected.z / unprojected.w);
+}
+
+bool FFX_DNSR_Shadows_IsDisoccluded(uint2 did, float depth, float2 velocity) // Returns true when the pixel's reprojected position is off-screen or fails the depth test.
+{
+    const int2 dims = FFX_DNSR_Shadows_GetBufferDimensions();
+    const float2 texel_size = FFX_DNSR_Shadows_GetInvBufferDimensions();
+    const float2 uv = (did + 0.5f) * texel_size;
+    const float2 ndc = (2.0f * uv - 1.0f) * float2(1.0f, -1.0f);
+    const float2 previous_uv = uv - velocity; // velocity is subtracted directly from uv, so it is presumably given in uv units
+
+    bool is_disoccluded = true; // stays true when previous_uv falls outside the (0, 1) range
+    if (all(previous_uv > 0.0) && all(previous_uv < 1.0))
+    {
+        // Read the center values
+        float3 normal = FFX_DNSR_Shadows_ReadNormals(did);
+
+        float4 clip_space = mul(FFX_DNSR_Shadows_GetReprojectionMatrix(), float4(ndc, depth, 1.0f)); // presumably the pixel's position in the previous frame's clip space
+        clip_space /= clip_space.w; // perspective divide
+
+        // How aligned with the view vector? (the more Z aligned, the higher the depth errors)
+        const float4 homogeneous = mul(FFX_DNSR_Shadows_GetViewProjectionInverse(), float4(ndc, depth, 1.0f));
+        const float3 world_position = homogeneous.xyz / homogeneous.w;  // perspective divide
+        const float3 view_direction = normalize(FFX_DNSR_Shadows_GetEye().xyz - world_position);
+        float z_alignment = 1.0f - dot(view_direction, normal); // 0 when the normal points at the eye, larger as it turns away
+        z_alignment = pow(z_alignment, 8);
+
+        // Calculate the depth difference
+        float linear_depth = FFX_DNSR_Shadows_GetLinearDepth(did, clip_space.z);   // get linear depth
+
+        int2 idx = previous_uv * dims; // truncates to the texel that contains previous_uv
+        const float previous_depth = FFX_DNSR_Shadows_GetLinearDepth(idx, FFX_DNSR_Shadows_ReadPreviousDepth(idx));
+        const float depth_difference = abs(previous_depth - linear_depth) / linear_depth; // relative difference
+
+        // Resolve into the disocclusion mask
+        const float depth_tolerance = lerp(1e-2f, 1e-1f, z_alignment); // tolerance grows from 1% towards 10% with z_alignment
+        is_disoccluded = depth_difference >= depth_tolerance;
+    }
+
+    return is_disoccluded;
+}
+
+float2 FFX_DNSR_Shadows_GetClosestVelocity(int2 did, float depth) // Picks the velocity of the closest-depth pixel within this lane's 2x2 quad.
+{
+    float2 closest_velocity = FFX_DNSR_Shadows_ReadVelocity(did);
+    float closest_depth = depth;
+
+    float new_depth = QuadReadAcrossX(closest_depth); // first compare against the horizontal neighbor in the quad
+    float2 new_velocity = QuadReadAcrossX(closest_velocity);
+#ifdef INVERTED_DEPTH_RANGE
+    if (new_depth > closest_depth)
+#else
+    if (new_depth < closest_depth)
+#endif
+    {
+        closest_depth = new_depth;
+        closest_velocity = new_velocity;
+    }
+
+    new_depth = QuadReadAcrossY(closest_depth); // the vertical neighbor already holds the winner of its own row
+    new_velocity = QuadReadAcrossY(closest_velocity);
+#ifdef INVERTED_DEPTH_RANGE
+    if (new_depth > closest_depth)
+#else
+    if (new_depth < closest_depth)
+#endif
+    {
+        closest_depth = new_depth;
+        closest_velocity = new_velocity;
+    }
+
+    return closest_velocity * float2(0.5f, -0.5f);  // from ndc to uv
+}
+
+#define KERNEL_RADIUS 8
+float FFX_DNSR_Shadows_KernelWeight(float i) // Normalized Gaussian weight for a tap i pixels away from the kernel center.
+{
+    // The macro argument is parenthesized so compound expressions (e.g. a - b) square correctly.
+#define KERNEL_WEIGHT(d) (exp(-3.0 * float((d) * (d)) / ((KERNEL_RADIUS + 1.0) * (KERNEL_RADIUS + 1.0))))
+
+    // The normalization factor depends only on constants, so it is expected to be folded at compile time.
+    float kernel_weights_sum = KERNEL_WEIGHT(0);
+    for (int c = 1; c <= KERNEL_RADIUS; ++c)
+    {
+        kernel_weights_sum += 2 * KERNEL_WEIGHT(c); // every off-center tap exists on both sides of the center
+    }
+    const float inv_kernel_weights_sum = rcp(kernel_weights_sum);
+
+    // The only part that depends on the runtime argument.
+    return KERNEL_WEIGHT(i) * inv_kernel_weights_sum;
+}
+
+void FFX_DNSR_Shadows_AccumulateMoments(float value, float weight, inout float moments)
+{
+    // value stems from the horizontal neighborhood pass; with one sample per pixel it serves as both mean and variance.
+    moments = moments + weight * value;
+}
+
+// The horizontal part of a 17x17 local neighborhood kernel: the kernel-weighted sum of the shadow mask bits of the 17 pixels centered on did within its row.
+float FFX_DNSR_Shadows_HorizontalNeighborhood(int2 did)
+{
+   const int2 base_did = did;
+
+    // Prevent vertical out of bounds access (rows outside the buffer contribute 0)
+    if ((base_did.y < 0) || (base_did.y >= FFX_DNSR_Shadows_GetBufferDimensions().y)) return 0;
+
+    const uint2 tile_index = FFX_DNSR_Shadows_GetTileIndexFromPixelPosition(base_did);
+    const uint linear_tile_index = FFX_DNSR_Shadows_LinearTileIndex(tile_index, FFX_DNSR_Shadows_GetBufferDimensions().x);
+
+    const int left_tile_index = linear_tile_index - 1;
+    const int center_tile_index = linear_tile_index;
+    const int right_tile_index = linear_tile_index + 1;
+
+    bool is_first_tile_in_row = tile_index.x == 0;
+    bool is_last_tile_in_row = tile_index.x == (FFX_DNSR_Shadows_RoundedDivide(FFX_DNSR_Shadows_GetBufferDimensions().x, 8) - 1);
+
+    uint left_tile = 0; // a missing left neighbor contributes all-zero bits
+    if (!is_first_tile_in_row) left_tile = FFX_DNSR_Shadows_ReadRaytracedShadowMask(left_tile_index);
+    uint center_tile = FFX_DNSR_Shadows_ReadRaytracedShadowMask(center_tile_index);
+    uint right_tile = 0; // a missing right neighbor contributes all-zero bits
+    if (!is_last_tile_in_row) right_tile = FFX_DNSR_Shadows_ReadRaytracedShadowMask(right_tile_index);
+
+    // Construct a single uint with the lowest 17 bits containing the horizontal part of the local neighborhood.
+
+    // First extract the 8 bits of our row in each of the neighboring tiles (each mask row is 8 bits wide, 4 rows per mask)
+    const uint row_base_index = (did.y % 4) * 8;
+    const uint left = (left_tile >> row_base_index) & 0xFF;
+    const uint center = (center_tile >> row_base_index) & 0xFF;
+    const uint right = (right_tile >> row_base_index) & 0xFF;
+
+    // Combine them into a single mask containing [left, center, right] from least significant to most significant bit
+    uint neighborhood = left | (center << 8) | (right << 16);
+
+    // Make sure our pixel ends up at bit index 8 (the 9th bit) to get the highest contribution from the filter kernel
+    const uint bit_index_in_row = (did.x % 8);
+    neighborhood = neighborhood >> bit_index_in_row; // Shift out bits to the right, so the center bit ends up at bit index 8.
+
+    float moment = 0.0; // For one sample per pixel this is both mean and variance
+
+    // First 8 bits up to the center pixel (bit i lies 8 - i pixels to the left of it)
+    uint mask;
+    int i;
+    for (i = 0; i < 8; ++i)
+    {
+        mask = 1u << i;
+        moment += (mask & neighborhood) ? FFX_DNSR_Shadows_KernelWeight(8 - i) : 0;
+    }
+
+    // Center pixel
+    mask = 1u << 8;
+    moment += (mask & neighborhood) ? FFX_DNSR_Shadows_KernelWeight(0) : 0;
+
+    // Last 8 bits (bit 8 + i lies i pixels to the right of the center)
+    for (i = 1; i <= 8; ++i)
+    {
+        mask = 1u << (8 + i);
+        moment += (mask & neighborhood) ? FFX_DNSR_Shadows_KernelWeight(i) : 0;
+    }
+
+    return moment;
+}
+
+groupshared float g_FFX_DNSR_Shadows_neighborhood[8][24];
+
+float FFX_DNSR_Shadows_ComputeLocalNeighborhood(int2 did, int2 gtid)
+{
+    // Vertical half of the neighborhood kernel. Each thread publishes the horizontal
+    // result of its own row and of the rows 8 above and 8 below, so that after the
+    // barrier a column of 24 values is available for every gtid.x.
+    const float row_above = FFX_DNSR_Shadows_HorizontalNeighborhood(int2(did.x, did.y - 8));
+    const float row_own = FFX_DNSR_Shadows_HorizontalNeighborhood(int2(did.x, did.y));
+    const float row_below = FFX_DNSR_Shadows_HorizontalNeighborhood(int2(did.x, did.y + 8));
+
+    g_FFX_DNSR_Shadows_neighborhood[gtid.x][gtid.y] = row_above;
+    g_FFX_DNSR_Shadows_neighborhood[gtid.x][gtid.y + 8] = row_own;
+    g_FFX_DNSR_Shadows_neighborhood[gtid.x][gtid.y + 16] = row_below;
+
+    GroupMemoryBarrierWithGroupSync();
+
+    // The taps at distance 0 and +-KERNEL_RADIUS are the thread's own three values.
+    float weighted_sum = 0;
+    FFX_DNSR_Shadows_AccumulateMoments(row_own, FFX_DNSR_Shadows_KernelWeight(0), weighted_sum);
+    FFX_DNSR_Shadows_AccumulateMoments(row_above, FFX_DNSR_Shadows_KernelWeight(KERNEL_RADIUS), weighted_sum);
+    FFX_DNSR_Shadows_AccumulateMoments(row_below, FFX_DNSR_Shadows_KernelWeight(KERNEL_RADIUS), weighted_sum);
+
+    // The taps in between are read back from the shared column.
+    const int own_slot = gtid.y + 8;
+    for (int dist = 1; dist < KERNEL_RADIUS; ++dist)
+    {
+        const float tap_weight = FFX_DNSR_Shadows_KernelWeight(dist);
+        FFX_DNSR_Shadows_AccumulateMoments(g_FFX_DNSR_Shadows_neighborhood[gtid.x][own_slot - dist], tap_weight, weighted_sum);
+        FFX_DNSR_Shadows_AccumulateMoments(g_FFX_DNSR_Shadows_neighborhood[gtid.x][own_slot + dist], tap_weight, weighted_sum);
+    }
+
+    return weighted_sum;
+}
+
+void FFX_DNSR_Shadows_WriteTileMetaData(uint2 gid, uint2 gtid, bool is_cleared, bool all_in_light)
+{
+    // Only the thread at gtid (0, 0) writes the entry for tile gid; every other thread does nothing.
+    if (any(gtid != 0)) { return; }
+
+    uint flags = is_cleared ? TILE_META_DATA_CLEAR_MASK : 0;
+    if (all_in_light) { flags |= TILE_META_DATA_LIGHT_MASK; }
+    const uint tiles_per_row = FFX_DNSR_Shadows_RoundedDivide(FFX_DNSR_Shadows_GetBufferDimensions().x, 8);
+    FFX_DNSR_Shadows_WriteMetadata(gid.y * tiles_per_row + gid.x, flags);
+}
+
+void FFX_DNSR_Shadows_ClearTargets(uint2 did, uint2 gtid, uint2 gid, float shadow_value, bool is_shadow_receiver, bool all_in_light)
+{
+    // Flags the tile as cleared and writes a constant result with zero variance for pixel did.
+    const float sample_count = is_shadow_receiver ? 1 : 0; // temporal sample count stored with the moments
+    FFX_DNSR_Shadows_WriteTileMetaData(gid, gtid, true, all_in_light);
+    FFX_DNSR_Shadows_WriteReprojectionResults(did, float2(shadow_value, 0)); // mean, variance
+    FFX_DNSR_Shadows_WriteMoments(did, float3(shadow_value, 0, sample_count)); // mean, variance, temporal sample count
+}
+
+void FFX_DNSR_Shadows_TileClassification(uint group_index, uint2 gid)
+{ // Either clears the outputs of an 8x8 tile that can be skipped, or writes the temporally reprojected shadow, variance and moments per pixel.
+    uint2 gtid = FFX_DNSR_Shadows_RemapLane8x8(group_index); // Make sure we can use the QuadReadAcross intrinsics to access a 2x2 region.
+    uint2 did = gid * 8 + gtid; // pixel coordinate: each group covers 8x8 pixels
+
+    bool is_shadow_receiver = FFX_DNSR_Shadows_IsShadowReciever(did);
+    // Early-out 1: the whole group reports that none of its lanes is a shadow receiver.
+    bool skip_sky = FFX_DNSR_Shadows_ThreadGroupAllTrue(!is_shadow_receiver);
+    if (skip_sky)
+    {
+        // We have to set all resources of the tile we skipped to sensible values as neighboring active denoiser tiles might want to read them.
+        FFX_DNSR_Shadows_ClearTargets(did, gtid, gid, 0, is_shadow_receiver, false);
+        return;
+    }
+    // Early-out 2: every lane agrees that the searched region is uniformly lit or uniformly shadowed.
+    bool all_in_light = false;
+    bool all_in_shadow = false;
+    FFX_DNSR_Shadows_SearchSpatialRegion(gid, all_in_light, all_in_shadow);
+    float shadow_value = all_in_light ? 1 : 0; // Either all_in_light or all_in_shadow must be true, otherwise we would not skip the tile.
+
+    bool can_skip = all_in_light || all_in_shadow;
+    // We have to append the entire tile if there is a single lane that we can't skip
+    bool skip_tile = FFX_DNSR_Shadows_ThreadGroupAllTrue(can_skip);
+    if (skip_tile)
+    {
+        // We have to set all resources of the tile we skipped to sensible values as neighboring active denoiser tiles might want to read them.
+        FFX_DNSR_Shadows_ClearTargets(did, gtid, gid, shadow_value, is_shadow_receiver, all_in_light);
+        return;
+    }
+
+    FFX_DNSR_Shadows_WriteTileMetaData(gid, gtid, false, false); // tile is processed: not cleared, not flagged as fully lit
+
+    float depth = FFX_DNSR_Shadows_ReadDepth(did);
+    const float2 velocity = FFX_DNSR_Shadows_GetClosestVelocity(did.xy, depth); // Must happen before we deactivate lanes
+    const float local_neighborhood = FFX_DNSR_Shadows_ComputeLocalNeighborhood(did, gtid);
+    // History lookup position: pixel-center UV minus velocity, scaled back to pixel coordinates.
+    const float2 texel_size = FFX_DNSR_Shadows_GetInvBufferDimensions();
+    const float2 uv = (did.xy + 0.5f) * texel_size;
+    const float2 history_uv = uv - velocity;
+    const int2 history_pos = history_uv * FFX_DNSR_Shadows_GetBufferDimensions();
+
+    const uint2 tile_index = FFX_DNSR_Shadows_GetTileIndexFromPixelPosition(did);
+    const uint linear_tile_index = FFX_DNSR_Shadows_LinearTileIndex(tile_index, FFX_DNSR_Shadows_GetBufferDimensions().x);
+
+    const uint shadow_tile = FFX_DNSR_Shadows_ReadRaytracedShadowMask(linear_tile_index); // bit mask of the 8x4 tile that contains did
+
+    float3 moments_current = 0;
+    float variance = 0;
+    float shadow_clamped = 0;
+    if (is_shadow_receiver) // do not process sky pixels
+    {
+        bool hit_light = shadow_tile & FFX_DNSR_Shadows_GetBitMaskFromPixelPosition(did);
+        const float shadow_current = hit_light ? 1.0 : 0.0;
+
+        // Perform moments and variance calculations
+        {
+            bool is_disoccluded = FFX_DNSR_Shadows_IsDisoccluded(did, depth, velocity);
+            const float3 previous_moments = is_disoccluded ? float3(0.0f, 0.0f, 0.0f) // Can't trust previous moments on disocclusion
+                : FFX_DNSR_Shadows_ReadPreviousMomentsBuffer(history_pos);
+            // Running update in the style of Welford's algorithm: m is the mean, s the sum of squared deviations.
+            const float old_m = previous_moments.x;
+            const float old_s = previous_moments.y;
+            const float sample_count = previous_moments.z + 1.0f;
+            const float new_m = old_m + (shadow_current - old_m) / sample_count;
+            const float new_s = old_s + (shadow_current - old_m) * (shadow_current - new_m);
+            // With a sample count of 1 or less there is no estimate (division by zero); use 1 instead.
+            variance = (sample_count > 1.0f ? new_s / (sample_count - 1.0f) : 1.0f);
+            moments_current = float3(new_m, new_s, sample_count);
+        }
+
+        // Retrieve local neighborhood and reproject
+        {
+            float mean = local_neighborhood;
+            float spatial_variance = local_neighborhood;
+            // local_neighborhood is used as both first and second moment, so this is E[x^2] - E[x]^2, clamped at 0.
+            spatial_variance = max(spatial_variance - mean * mean, 0.0f);
+
+            // Compute the clamping bounding box
+            const float std_deviation = sqrt(spatial_variance);
+            const float nmin = mean - 0.5f * std_deviation;
+            const float nmax = mean + 0.5f * std_deviation;
+
+            // Clamp reprojected sample to local neighborhood (on the first frame the current sample stands in for the history)
+            float shadow_previous = shadow_current;
+            if (FFX_DNSR_Shadows_IsFirstFrame() == 0)
+            {
+                shadow_previous = FFX_DNSR_Shadows_ReadHistory(history_uv);
+            }
+
+            shadow_clamped = clamp(shadow_previous, nmin, nmax);
+
+            // Reduce history weighting: scale the sample count by exp(-d * d / sigma), d = distance of the history from the mean in clamp half-widths
+            float const sigma = 20.0f;
+            float const temporal_discontinuity = (shadow_previous - mean) / max(0.5f * std_deviation, 0.001f);
+            float const sample_counter_damper = exp(-temporal_discontinuity * temporal_discontinuity / sigma);
+            moments_current.z *= sample_counter_damper;
+
+            // Boost variance on first frames (damped sample count below 16)
+            if (moments_current.z < 16.0f)
+            {
+                const float variance_boost = max(16.0f - moments_current.z, 1.0f);
+                variance = max(variance, spatial_variance);
+                variance *= variance_boost;
+            }
+        }
+
+        // Perform the temporal blend: the current sample's weight falls from 1.0 (sample count 0) to 0.05 (sample count 8 or more)
+        const float history_weight = sqrt(max(8.0f - moments_current.z, 0.0f) / 8.0f);
+        shadow_clamped = lerp(shadow_clamped, shadow_current, lerp(0.05f, 1.0f, history_weight));
+    }
+
+    // Output the results of the temporal pass (all zeros for pixels that are not shadow receivers)
+    FFX_DNSR_Shadows_WriteReprojectionResults(did.xy, float2(shadow_clamped, variance));
+    FFX_DNSR_Shadows_WriteMoments(did.xy, moments_current);
+}
+
+#endif
diff --git a/ffx-shadows-dnsr/ffx_denoiser_shadows_util.h b/ffx-shadows-dnsr/ffx_denoiser_shadows_util.h
new file mode 100644
index 0000000..1726012
--- /dev/null
+++ b/ffx-shadows-dnsr/ffx_denoiser_shadows_util.h
@@ -0,0 +1,71 @@
+/**********************************************************************
+Copyright (c) 2021 Advanced Micro Devices, Inc. All rights reserved.
+
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+
+The above copyright notice and this permission notice shall be included in
+all copies or substantial portions of the Software.
+
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+THE SOFTWARE.
+********************************************************************/
+
+#ifndef FFX_DNSR_SHADOWS_UTILS_HLSL
+#define FFX_DNSR_SHADOWS_UTILS_HLSL
+
+uint FFX_DNSR_Shadows_RoundedDivide(uint value, uint divisor)
+{ // Returns value / divisor rounded up to the next integer (ceiling division); divisor must not be 0 when value is non-zero.
+    return (value == 0u) ? 0u : (value - 1u) / divisor + 1u; // same result as (value + divisor - 1) / divisor, but the sum cannot wrap around
+}
+
+uint2 FFX_DNSR_Shadows_GetTileIndexFromPixelPosition(uint2 pixel_pos)
+{ // Maps a pixel coordinate to the coordinate of the tile containing it; tiles are 8 pixels wide and 4 pixels tall.
+    return pixel_pos / uint2(8, 4); // component-wise integer division
+}
+
+uint FFX_DNSR_Shadows_LinearTileIndex(uint2 tile_index, uint screen_width)
+{ // Flattens a 2D tile coordinate row by row; a row holds screen_width / 8 tiles, rounded up.
+    return tile_index.x + tile_index.y * FFX_DNSR_Shadows_RoundedDivide(screen_width, 8);
+}
+
+uint FFX_DNSR_Shadows_GetBitMaskFromPixelPosition(uint2 pixel_pos)
+{ // Single-bit mask for a pixel inside its 8x4 tile; bits are numbered row by row: (y % 4) * 8 + (x % 8).
+    const uint2 in_tile = pixel_pos % uint2(8, 4);
+    return 1u << (in_tile.y * 8 + in_tile.x);
+}
+
+#define TILE_META_DATA_CLEAR_MASK 0b01u // bit 0: set when the tile was written as cleared (is_cleared)
+#define TILE_META_DATA_LIGHT_MASK 0b10u // bit 1: set when the tile was written as fully lit (all_in_light)
+
+// From ffx_a.h
+
+uint FFX_DNSR_Shadows_BitfieldExtract(uint src, uint off, uint bits) { uint mask = (bits < 32u) ? ((1u << bits) - 1u) : 0xffffffffu; return (src >> off) & mask; } // ABfe: returns the 'bits' bits of src that start at bit 'off'; unsigned mask, full mask for bits >= 32
+uint FFX_DNSR_Shadows_BitfieldInsert(uint src, uint ins, uint bits) { uint mask = (bits < 32u) ? ((1u << bits) - 1u) : 0xffffffffu; return (ins & mask) | (src & (~mask)); } // ABfiM: returns src with its low 'bits' bits replaced by those of ins; unsigned mask, full mask for bits >= 32
+
+//  LANE TO 8x8 MAPPING
+//  ===================
+//  00 01 08 09 10 11 18 19 
+//  02 03 0a 0b 12 13 1a 1b
+//  04 05 0c 0d 14 15 1c 1d
+//  06 07 0e 0f 16 17 1e 1f 
+//  20 21 28 29 30 31 38 39 
+//  22 23 2a 2b 32 33 3a 3b
+//  24 25 2c 2d 34 35 3c 3d
+//  26 27 2e 2f 36 37 3e 3f 
+uint2 FFX_DNSR_Shadows_RemapLane8x8(uint lane) {
+    const uint x = FFX_DNSR_Shadows_BitfieldInsert(FFX_DNSR_Shadows_BitfieldExtract(lane, 2u, 3u), lane, 1u); // x bits 2..0 = lane bits 4, 3, 0
+    const uint y = FFX_DNSR_Shadows_BitfieldInsert(FFX_DNSR_Shadows_BitfieldExtract(lane, 3u, 3u), FFX_DNSR_Shadows_BitfieldExtract(lane, 1u, 2u), 2u); // y bits 2..0 = lane bits 5, 2, 1
+    return uint2(x, y);
+}
+
+#endif