You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 

89 lines
3.1 KiB

// This file is part of the FidelityFX SDK.
//
// Copyright (C) 2024 Advanced Micro Devices, Inc.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files(the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and /or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions :
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.
#include "../ffx_core.h"
#if FFX_HALF
#define FFX_CAS_PACKED_ONLY 1
#endif // FFX_HALF
#include "ffx_cas.h"
void Sharpen(FfxUInt32x3 LocalThreadId, FfxUInt32x3 WorkGroupId, FfxUInt32x3 Dtid)
{
// Do remapping of local xy in workgroup for a more PS-like swizzle pattern.
FfxUInt32x2 gxy = ffxRemapForQuad(LocalThreadId.x) + FfxUInt32x2(WorkGroupId.x << 4u, WorkGroupId.y << 4u);
FfxBoolean sharpenOnly;
#if FFX_CAS_OPTION_SHARPEN_ONLY
sharpenOnly = true;
#else
sharpenOnly = false;
#endif // FFX_CAS_OPTION_SHARPEN_ONLY
#if FFX_HALF
// Filter.
FfxFloat16x4 c0, c1;
FfxFloat16x2 cR, cG, cB;
ffxCasFilterHalf(cR, cG, cB, gxy, Const0(), Const1(), sharpenOnly);
casOutputHalf(cR, cG, cB);
ffxCasDepackHalf(c0, c1, cR, cG, cB);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c0));
casStoreOutput(FfxInt32x2(gxy) + FfxInt32x2(8, 0), FfxFloat32x4(c1));
gxy.y += 8u;
ffxCasFilterHalf(cR, cG, cB, gxy, Const0(), Const1(), sharpenOnly);
casOutputHalf(cR, cG, cB);
ffxCasDepackHalf(c0, c1, cR, cG, cB);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c0));
casStoreOutput(FfxInt32x2(gxy) + FfxInt32x2(8, 0), FfxFloat32x4(c1));
#else
// Filter.
FfxFloat32x3 c;
ffxCasFilter(c.r, c.g, c.b, gxy, Const0(), Const1(), sharpenOnly);
casOutput(c.r, c.g, c.b);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c, 1));
gxy.x += 8u;
ffxCasFilter(c.r, c.g, c.b, gxy, Const0(), Const1(), sharpenOnly);
casOutput(c.r, c.g, c.b);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c, 1));
gxy.y += 8u;
ffxCasFilter(c.r, c.g, c.b, gxy, Const0(), Const1(), sharpenOnly);
casOutput(c.r, c.g, c.b);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c, 1));
gxy.x -= 8u;
ffxCasFilter(c.r, c.g, c.b, gxy, Const0(), Const1(), sharpenOnly);
casOutput(c.r, c.g, c.b);
casStoreOutput(FfxInt32x2(gxy), FfxFloat32x4(c, 1));
#endif // FFX_HALF
}