117 lines
3.5 KiB
C
117 lines
3.5 KiB
C
// This file is part of the FidelityFX SDK.
|
|
//
|
|
// Copyright (C) 2024 Advanced Micro Devices, Inc.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
// of this software and associated documentation files(the "Software"), to deal
|
|
// in the Software without restriction, including without limitation the rights
|
|
// to use, copy, modify, merge, publish, distribute, sublicense, and /or sell
|
|
// copies of the Software, and to permit persons to whom the Software is
|
|
// furnished to do so, subject to the following conditions :
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in
|
|
// all copies or substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
// THE SOFTWARE.
|
|
|
|
// NOTE(review): GROUP_SIZE is not referenced in the visible part of this file; presumably it is consumed by an including shader or header - confirm.
#define GROUP_SIZE 8
|
|
// Defined ahead of the fsr1/ffx_fsr1.h include further down; presumably selects the denoising variant of RCAS in that header - confirm.
#define FSR_RCAS_DENOISE 1
|
|
|
|
#include "ffx_core.h"
|
|
|
|
#if FFX_HALF
|
|
// Set only when FFX_HALF is enabled, ahead of the fsr1/ffx_fsr1.h include; presumably requests the packed 16-bit FsrRcasHx2 entry point that CurrFilter calls - confirm against that header.
#define FSR_RCAS_HX2 1
|
|
// Load hook for the packed 16-bit RCAS path.
// Forwards the integer coordinate `p` to LoadRCas_Input and returns the fetched value
// as a 16-bit float 4-vector.
// NOTE(review): presumably invoked by the RCAS code in fsr1/ffx_fsr1.h - confirm.
FfxFloat16x4 FsrRcasLoadHx2(FfxInt16x2 p)
{
    FfxFloat16x4 texel = LoadRCas_Input(p);
    return texel;
}
|
|
// Input hook for the packed 16-bit RCAS path.
// The body is empty, so r, g and b are handed back to the caller unmodified.
void FsrRcasInputHx2(inout FfxFloat16x2 r, inout FfxFloat16x2 g, inout FfxFloat16x2 b)
{
}
|
|
#else
|
|
// Set when FFX_HALF is disabled, ahead of the fsr1/ffx_fsr1.h include; presumably requests the 32-bit FsrRcasF entry point that CurrFilter calls - confirm against that header.
#define FSR_RCAS_F 1
|
|
// Load hook for the 32-bit RCAS path.
// Forwards the integer coordinate `p` to LoadRCas_Input and returns the fetched value
// as a 32-bit float 4-vector.
// NOTE(review): presumably invoked by the RCAS code in fsr1/ffx_fsr1.h - confirm.
FfxFloat32x4 FsrRcasLoadF(FfxInt32x2 p)
{
    FfxFloat32x4 texel = LoadRCas_Input(p);
    return texel;
}
|
|
// Input hook for the 32-bit RCAS path.
// The body is empty, so r, g and b are handed back to the caller unmodified.
void FsrRcasInputF(inout FfxFloat32 r, inout FfxFloat32 g, inout FfxFloat32 b)
{
}
|
|
#endif // FFX_HALF
|
|
|
|
#if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
|
|
// Re-exports FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA under a second name ahead of the fsr1/ffx_fsr1.h include; presumably the name that header tests - confirm.
#define FSR_RCAS_PASSTHROUGH_ALPHA
|
|
#endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
|
|
|
|
#include "fsr1/ffx_fsr1.h"
|
|
|
|
// Runs the RCAS filter for the coordinate `pos` and stores the result.
//
// pos: integer pixel coordinate, forwarded to FsrRcasHx2 / FsrRcasF and to the
//      matching StoreRCasOutput* call.
//
// When RCasSample().x equals 1 the filtered colour is squared component-wise before
// it is stored.
// NOTE(review): presumably this undoes a square-root encoding applied upstream - confirm.
//
// Alpha handling is the same in both precision paths: only r, g and b are ever
// squared. With FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA enabled, alpha is stored
// exactly as returned by the filter; otherwise 1.0 is stored as alpha.
void CurrFilter(FFX_MIN16_U2 pos)
{
#if FFX_HALF

    // Packed 16-bit path: each channel variable carries two values.
#if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
    FfxFloat16x2 cr, cg, cb, ca;
    FsrRcasHx2(cr, cg, cb, ca, pos, RCasConfig());
#else
    FfxFloat16x2 cr, cg, cb;
    FsrRcasHx2(cr, cg, cb, pos, RCasConfig());
#endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA

    if (RCasSample().x == 1)
    {
        // Colour channels only; `ca` is deliberately left untouched.
        cr *= cr;
        cg *= cg;
        cb *= cb;
    }

#if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
    StoreRCasOutputHx2(FfxInt16x2(pos), cr, cg, cb, ca);
#else
    StoreRCasOutputHx2(FfxInt16x2(pos), cr, cg, cb, FfxFloat16x2(1.0, 1.0));
#endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA

#else

    // 32-bit path: one pixel per call.
#if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
    FfxFloat32x4 c;
    FsrRcasF(c.r, c.g, c.b, c.a, pos, RCasConfig());
#else
    FfxFloat32x3 c;
    FsrRcasF(c.r, c.g, c.b, pos, RCasConfig());
#endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA

    if (RCasSample().x == 1)
    {
        // Square colour only. `c` is a 4-vector when alpha passthrough is enabled,
        // and a whole-vector `c *= c` would also square alpha, which both breaks
        // the passthrough and disagrees with the packed 16-bit path above.
        c.rgb *= c.rgb;
    }

#if FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA
    StoreRCasOutput(FfxInt32x2(pos), c);
#else
    StoreRCasOutput(FfxInt32x2(pos), FfxFloat32x4(c, 1.0));
#endif // FFX_FSR1_OPTION_RCAS_PASSTHROUGH_ALPHA

#endif // FFX_HALF
}
|
|
|
|
// Entry point for the RCAS pass.
//
// LocalThreadId: only .x is read; it is remapped to a 2D position via ffxRemapForQuad.
// WorkGroupId:   .x and .y are shifted left by 4, i.e. each workgroup starts on a
//                multiple of 16 in both axes.
// Dtid:          not used by this function.
//
// CurrFilter is invoked for the remapped base coordinate and for further coordinates
// offset by 8 from it, as laid out in the two branches below.
void RCAS(FfxUInt32x3 LocalThreadId, FfxUInt32x3 WorkGroupId, FfxUInt32x3 Dtid)
{
    // Remap the local index within the workgroup for a more PS-like swizzle pattern,
    // then translate it by the workgroup's origin.
    FfxUInt32x2 groupOrigin = FfxUInt32x2(WorkGroupId.x << 4u, WorkGroupId.y << 4u);
    FfxUInt32x2 base        = ffxRemapForQuad(LocalThreadId.x) + groupOrigin;

#if FFX_HALF
    // The packed variant processes a left and a right 8x8 tile per call (a 16x8
    // region in total), so only the upper and the lower row of tiles are issued.
    CurrFilter(FFX_MIN16_U2(base));
    CurrFilter(FFX_MIN16_U2(base + FfxUInt32x2(0u, 8u)));
#else
    // Unpacked variant: issue the four tiles one by one, in the order
    // (0,0) -> (8,0) -> (8,8) -> (0,8).
    CurrFilter(FFX_MIN16_U2(base));
    CurrFilter(FFX_MIN16_U2(base + FfxUInt32x2(8u, 0u)));
    CurrFilter(FFX_MIN16_U2(base + FfxUInt32x2(8u, 8u)));
    CurrFilter(FFX_MIN16_U2(base + FfxUInt32x2(0u, 8u)));
#endif // FFX_HALF
}
|