TexConv/CMP_Core/shaders/cas_main.hlsl

80 lines
2.5 KiB
HLSL

// LICENSE
// =======
// Copyright (c) 2019-2021 Advanced Micro Devices, Inc. All rights reserved.
// -------
// Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation
// files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy,
// modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the
// Software is furnished to do so, subject to the following conditions:
// -------
// The above copyright notice and this permission notice shall be included in all copies or substantial portions of the
// Software.
// -------
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
// WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
// COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
// Constant buffer bound to register b0.
// Both members are forwarded unchanged to CasFilter() by mainCS.
// NOTE(review): presumably these are the packed CAS constants prepared on the
// CPU side (e.g. by a CasSetup-style helper) - confirm against the host code.
cbuffer cb : register(b0)
{
// First constant vector handed to CasFilter().
uint4 const0;
// Second constant vector handed to CasFilter().
uint4 const1;
};
// Source image. Read through CasLoad(), which fetches mip 0 and keeps only .rgb.
// No explicit register(...) binding is declared here.
Texture2D InputTexture;
// Destination image. Written by StoreOutput(), which always stores alpha = 1.
// No explicit register(...) binding is declared here.
RWTexture2D<float4> OutputTexture;
#define A_GPU 1
#define A_HLSL 1
#define USE_CMP_FIDELITY_FX_H
#include "common_def.h"
// Returns the RGB channels of the InputTexture texel at integer coordinate `p`.
// The third Load component selects the mip level; only mip 0 is read.
// The alpha channel of the source texel is discarded.
AF3 CasLoad(ASU2 p)
{
    const int3 texelAndMip = int3(p, 0);
    return InputTexture.Load(texelAndMip).rgb;
}
// Input transform applied in place to one RGB sample.
// When LINEAR is set the channels are left untouched; otherwise each channel
// is passed through AFromSrgbF1().
// NOTE(review): defined ahead of the ffx_cas.h include, so presumably this is
// a callback that header expects - confirm.
void CasInput(inout AF1 r, inout AF1 g, inout AF1 b)
{
    // Nothing to convert when LINEAR is set.
    if (LINEAR)
    {
        return;
    }

    r = AFromSrgbF1(r);
    g = AFromSrgbF1(g);
    b = AFromSrgbF1(b);
}
#include "ffx_cas.h"
// Writes one filtered pixel to OutputTexture at coordinate `p`.
// Unless LINEAR is set, each channel is first passed through AToSrgbF1()
// (the counterpart of the AFromSrgbF1() call in CasInput).
// Alpha is always written as 1.
void StoreOutput(ASU2 p, AF3 value)
{
    AF3 encoded = value;
    if (!LINEAR)
    {
        encoded.r = AToSrgbF1(value.r);
        encoded.g = AToSrgbF1(value.g);
        encoded.b = AToSrgbF1(value.b);
    }

    OutputTexture[p] = AF4(encoded.r, encoded.g, encoded.b, 1);
}
// Compute entry point: 64 threads per group, each thread filters four pixels.
// A group's base coordinate is its group ID times 16 on each axis (<< 4), and
// every thread visits its remapped position plus the three positions offset
// by 8 in x, in x and y, and in y - in that order.
[numthreads(64, 1, 1)]
void mainCS(uint3 LocalThreadId : SV_GroupThreadID, uint3 WorkGroupId : SV_GroupID)
{
    // Remap the linear thread index to an xy position inside the workgroup
    // for a more PS-like swizzle pattern, then add the group's base coordinate.
    const AU2 groupBase = AU2(WorkGroupId.x << 4u, WorkGroupId.y << 4u);
    const AU2 pixel00 = ARmp8x8(LocalThreadId.x) + groupBase;
    const AU2 pixel10 = AU2(pixel00.x + 8u, pixel00.y);
    const AU2 pixel11 = AU2(pixel00.x + 8u, pixel00.y + 8u);
    const AU2 pixel01 = AU2(pixel00.x, pixel00.y + 8u);

    // Filter result, reused for each of the four pixels.
    AF3 rgb;

    // Base position.
    CasFilter(rgb.r, rgb.g, rgb.b, pixel00, const0, const1, NO_SCALING);
    StoreOutput(ASU2(pixel00), rgb);

    // +8 in x.
    CasFilter(rgb.r, rgb.g, rgb.b, pixel10, const0, const1, NO_SCALING);
    StoreOutput(ASU2(pixel10), rgb);

    // +8 in x and y.
    CasFilter(rgb.r, rgb.g, rgb.b, pixel11, const0, const1, NO_SCALING);
    StoreOutput(ASU2(pixel11), rgb);

    // +8 in y.
    CasFilter(rgb.r, rgb.g, rgb.b, pixel01, const0, const1, NO_SCALING);
    StoreOutput(ASU2(pixel01), rgb);
}