// This file is part of the FidelityFX SDK. // // Copyright (C) 2024 Advanced Micro Devices, Inc. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files(the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and /or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions : // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN // THE SOFTWARE. #define GROUP_SIZE 8 #define FSR_RCAS_DENOISE 1 #include "ffx_core.h" #if FFX_HALF #define FSR_RCAS_HX2 1 FfxFloat16x4 FsrRcasLoadHx2(FfxInt16x2 p) { return LoadRCas_Input(p); } void FsrRcasInputHx2(inout FfxFloat16x2 r,inout FfxFloat16x2 g,inout FfxFloat16x2 b) {} #else #define FSR_RCAS_F 1 FfxFloat32x4 FsrRcasLoadF(FfxInt32x2 p) { return LoadRCas_Input(p); } void FsrRcasInputF(inout FfxFloat32 r, inout FfxFloat32 g, inout FfxFloat32 b) {} #endif // FFX_HALF #if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA #define FSR_RCAS_PASSTHROUGH_ALPHA #endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA #include "fsr1/ffx_fsr1.h" void CurrFilter(FFX_MIN16_U2 pos) { #if FFX_HALF #if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA FfxFloat16x2 cr, cg, cb, ca; FsrRcasHx2(cr, cg, cb, ca, pos, RCasConfig()); #else FfxFloat16x2 cr, cg, cb; FsrRcasHx2(cr, cg, cb, pos, RCasConfig()); #endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA if (RCasSample().x == 1) { cr *= cr; cg *= cg; cb *= cb; } #if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA StoreRCasOutputHx2(FfxInt16x2(pos), cr, cg, cb, ca); #else StoreRCasOutputHx2(FfxInt16x2(pos), cr, cg, cb, FfxFloat16x2(1.0, 1.0)); #endif #else #if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA FfxFloat32x4 c; FsrRcasF(c.r, c.g, c.b, c.a, pos, RCasConfig()); #else FfxFloat32x3 c; FsrRcasF(c.r, c.g, c.b, pos, RCasConfig()); #endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA if (RCasSample().x == 1) { c *= c; } #if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA StoreRCasOutput(FfxInt32x2(pos), c); #else StoreRCasOutput(FfxInt32x2(pos), FfxFloat32x4(c, 1.0)); #endif #endif } void RCAS(FfxUInt32x3 LocalThreadId, FfxUInt32x3 WorkGroupId, FfxUInt32x3 Dtid) { // Do remapping of local xy in workgroup for a more PS-like swizzle pattern. FfxUInt32x2 gxy = ffxRemapForQuad(LocalThreadId.x) + FfxUInt32x2(WorkGroupId.x << 4u, WorkGroupId.y << 4u); #if FFX_HALF // packed version process left and right 8x8 tile, in total 16x8 region CurrFilter(FFX_MIN16_U2(gxy)); gxy.y += 8u; CurrFilter(FFX_MIN16_U2(gxy)); #else CurrFilter(FFX_MIN16_U2(gxy)); gxy.x += 8u; CurrFilter(FFX_MIN16_U2(gxy)); gxy.y += 8u; CurrFilter(FFX_MIN16_U2(gxy)); gxy.x -= 8u; CurrFilter(FFX_MIN16_U2(gxy)); #endif }