mirror of
https://github.com/GreemDev/Ryujinx.git
synced 2024-12-20 22:05:53 +01:00
21c9ac6240
* Implement storage buffer operations using new Load/Store instruction * Extend GenerateMultiTargetStorageOp to also match access with constant offset, and log and comments * Remove now unused code * Catch more complex cases of global memory usage * Shader cache version bump * Extend global access elimination to work with more shared memory cases * Change alignment requirement from 16 bytes to 8 bytes, handle cases where we need more than 16 storage buffers * Tweak preferencing to catch more cases * Enable CB0 elimination even when host storage buffer alignment is > 16 (for Intel) * Fix storage buffer bindings * Simplify some code * Shader cache version bump * Fix typo * Extend global memory elimination to handle shared memory with multiple possible offsets and local memory
141 lines
5.4 KiB
C#
141 lines
5.4 KiB
C#
using Ryujinx.Graphics.Shader.IntermediateRepresentation;
|
|
using System;
|
|
using System.Collections.Generic;
|
|
|
|
using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
|
|
|
|
namespace Ryujinx.Graphics.Shader.Translation
|
|
{
|
|
/// <summary>
/// Generates helper functions on demand, appends them to a shared function list
/// and remembers the index assigned to each helper so it is only generated once.
/// </summary>
class HelperFunctionManager
{
    // Every function added through this manager is appended here; the index in this list is the function ID.
    private readonly List<Function> _functionList;

    // Helper name -> function ID, for helpers that were already generated.
    private readonly Dictionary<HelperFunctionName, int> _functionIds;

    // Shader stage the helpers are generated for; selects the stage specific code paths below.
    private readonly ShaderStage _stage;

    /// <summary>
    /// Creates a new helper function manager.
    /// </summary>
    /// <param name="functionList">List that receives the functions added through this manager</param>
    /// <param name="stage">Shader stage used to select stage specific helper code</param>
    public HelperFunctionManager(List<Function> functionList, ShaderStage stage)
    {
        _stage = stage;
        _functionIds = new Dictionary<HelperFunctionName, int>();
        _functionList = functionList;
    }

    /// <summary>
    /// Appends a function to the function list.
    /// </summary>
    /// <param name="function">Function to append</param>
    /// <returns>Index of the function inside the function list</returns>
    public int AddFunction(Function function)
    {
        _functionList.Add(function);

        // The function was appended, so its ID is the index of the last element.
        return _functionList.Count - 1;
    }

    /// <summary>
    /// Gets the ID of a helper function, generating and registering the function on first use.
    /// </summary>
    /// <param name="functionName">Helper function to look up</param>
    /// <returns>ID of the helper function</returns>
    /// <exception cref="ArgumentException">Thrown when <paramref name="functionName"/> has no generator</exception>
    public int GetOrCreateFunctionId(HelperFunctionName functionName)
    {
        if (!_functionIds.TryGetValue(functionName, out int id))
        {
            // Not generated yet: build it, append it to the list and cache the resulting ID.
            Function generated = GenerateFunction(functionName);

            id = AddFunction(generated);
            _functionIds.Add(functionName, id);
        }

        return id;
    }

    /// <summary>
    /// Dispatches to the generator matching the requested helper function.
    /// </summary>
    /// <param name="functionName">Helper function to generate</param>
    /// <returns>The generated function</returns>
    /// <exception cref="ArgumentException">Thrown when <paramref name="functionName"/> has no generator</exception>
    private Function GenerateFunction(HelperFunctionName functionName)
    {
        switch (functionName)
        {
            case HelperFunctionName.TexelFetchScale:
                return GenerateTexelFetchScaleFunction();
            case HelperFunctionName.TextureSizeUnscale:
                return GenerateTextureSizeUnscaleFunction();
            default:
                throw new ArgumentException($"Invalid function name {functionName}");
        }
    }

    /// <summary>
    /// Generates the "TexelFetchScale" helper.
    /// The helper returns argument 0 unchanged when the render scale equals 1, otherwise it returns
    /// argument 0 multiplied by the scale and converted back to a signed integer.
    /// On the fragment stage a negative scale takes a separate path that multiplies by the negated scale
    /// and adds the fragment coordinate modulo the negated scale.
    /// </summary>
    /// <returns>The generated function</returns>
    private Function GenerateTexelFetchScaleFunction()
    {
        var context = new EmitterContext();

        Operand input = Argument(0);
        Operand samplerIndex = Argument(1);
        Operand scale = LoadRenderScale(context, samplerIndex);

        EmitReturnInputWhenScaleIsOne(context, input, scale);

        bool isFragment = _stage == ShaderStage.Fragment;

        if (isFragment)
        {
            Operand scaleIsNegative = context.FPCompareLess(scale, ConstF(0f));
            Operand lblScaleNotNegative = Label();

            context.BranchIfFalse(lblScaleNotNegative, scaleIsNegative);

            Operand flippedScale = context.FPNegate(scale);
            Operand inputAsFloat = context.IConvertS32ToFP32(input);
            Operand scaledInput = context.FPMultiply(inputAsFloat, flippedScale);
            Operand coordX = context.Load(StorageKind.Input, IoVariable.FragmentCoord, null, Const(0));
            Operand coordY = context.Load(StorageKind.Input, IoVariable.FragmentCoord, null, Const(1));

            // Argument 2 only exists on the fragment variant; it picks the Y component over the X component.
            Operand coord = context.ConditionalSelect(Argument(2), coordY, coordX);
            Operand bias = context.FPModulo(coord, flippedScale);
            Operand biasedInput = context.FPAdd(scaledInput, bias);
            Operand biasedResult = context.FP32ConvertToS32(biasedInput);

            context.Return(biasedResult);
            context.MarkLabel(lblScaleNotNegative);
        }

        Operand inputFloat = context.IConvertS32ToFP32(input);
        Operand scaled = context.FPMultiply(inputFloat, scale);
        Operand scaledResult = context.FP32ConvertToS32(scaled);

        context.Return(scaledResult);

        // The fragment variant takes one extra input argument (the component selector).
        int inArgumentsCount = isFragment ? 3 : 2;
        var blocks = ControlFlowGraph.Create(context.GetOperations()).Blocks;

        return new Function(blocks, "TexelFetchScale", true, inArgumentsCount, 0);
    }

    /// <summary>
    /// Generates the "TextureSizeUnscale" helper.
    /// The helper returns argument 0 unchanged when the absolute render scale equals 1, otherwise it
    /// returns argument 0 divided by the absolute scale and converted back to a signed integer.
    /// </summary>
    /// <returns>The generated function</returns>
    private Function GenerateTextureSizeUnscaleFunction()
    {
        var context = new EmitterContext();

        Operand input = Argument(0);
        Operand samplerIndex = Argument(1);
        Operand signedScale = LoadRenderScale(context, samplerIndex);
        Operand scale = context.FPAbsolute(signedScale);

        EmitReturnInputWhenScaleIsOne(context, input, scale);

        Operand inputFloat = context.IConvertS32ToFP32(input);
        Operand unscaled = context.FPDivide(inputFloat, scale);
        Operand unscaledResult = context.FP32ConvertToS32(unscaled);

        context.Return(unscaledResult);

        var blocks = ControlFlowGraph.Create(context.GetOperations()).Blocks;

        return new Function(blocks, "TextureSizeUnscale", true, 2, 0);
    }

    /// <summary>
    /// Emits the constant buffer load of the render scale entry that belongs to a sampler.
    /// </summary>
    /// <param name="context">Emitter context receiving the operations</param>
    /// <param name="samplerIndex">Sampler index operand, before the stage specific adjustment</param>
    /// <returns>Operand holding the loaded scale</returns>
    private Operand LoadRenderScale(EmitterContext context, Operand samplerIndex)
    {
        Operand scaleIndex = GetScaleIndex(context, samplerIndex);

        return context.Load(StorageKind.ConstantBuffer, 0, Const((int)SupportBufferField.RenderScale), scaleIndex);
    }

    /// <summary>
    /// Emits a comparison of the scale against 1 followed by an early return of the input when they are equal.
    /// Operations emitted after this call belong to the "scale is not 1" path.
    /// </summary>
    /// <param name="context">Emitter context receiving the operations</param>
    /// <param name="input">Value returned unchanged when the scale equals 1</param>
    /// <param name="scale">Scale to compare against 1</param>
    private static void EmitReturnInputWhenScaleIsOne(EmitterContext context, Operand input, Operand scale)
    {
        Operand scaleIsOne = context.FPCompareEqual(scale, ConstF(1f));
        Operand lblScaleNotOne = Label();

        context.BranchIfFalse(lblScaleNotOne, scaleIsOne);
        context.Return(input);
        context.MarkLabel(lblScaleNotOne);
    }

    /// <summary>
    /// Emits the computation of the render scale index for a sampler index.
    /// The result is the index plus 1; on the vertex stage, the fragment render scale count
    /// loaded from the constant buffer is added as well.
    /// </summary>
    /// <param name="context">Emitter context receiving the operations</param>
    /// <param name="index">Sampler index operand</param>
    /// <returns>Operand holding the render scale index</returns>
    private Operand GetScaleIndex(EmitterContext context, Operand index)
    {
        if (_stage == ShaderStage.Vertex)
        {
            Operand fragScaleCount = context.Load(StorageKind.ConstantBuffer, 0, Const((int)SupportBufferField.FragmentRenderScaleCount));
            Operand vertexIndex = context.IAdd(index, fragScaleCount);

            return context.IAdd(Const(1), vertexIndex);
        }

        return context.IAdd(Const(1), index);
    }
}
|
|
} |