mirror of
https://github.com/Ryujinx/Ryujinx.git
synced 2024-12-28 22:23:23 +01:00
2df16ded9b
* Improve shader BRX instruction code generation * Shader cache version bump, add some comments and asserts
459 lines
No EOL
17 KiB
C#
459 lines
No EOL
17 KiB
C#
using Ryujinx.Graphics.Shader.Decoders;
|
|
using Ryujinx.Graphics.Shader.IntermediateRepresentation;
|
|
using System.Collections.Generic;
|
|
using System.Diagnostics;
|
|
using System.Numerics;
|
|
using System.Runtime.CompilerServices;
|
|
|
|
using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
|
|
|
|
namespace Ryujinx.Graphics.Shader.Translation
|
|
{
|
|
class EmitterContext
|
|
{
|
|
public DecodedProgram Program { get; }
|
|
public ShaderConfig Config { get; }
|
|
|
|
public bool IsNonMain { get; }
|
|
|
|
public Block CurrBlock { get; set; }
|
|
public InstOp CurrOp { get; set; }
|
|
|
|
public int OperationsCount => _operations.Count;
|
|
|
|
private struct BrxTarget
|
|
{
|
|
public readonly Operand Selector;
|
|
public readonly int ExpectedValue;
|
|
public readonly ulong NextTargetAddress;
|
|
|
|
public BrxTarget(Operand selector, int expectedValue, ulong nextTargetAddress)
|
|
{
|
|
Selector = selector;
|
|
ExpectedValue = expectedValue;
|
|
NextTargetAddress = nextTargetAddress;
|
|
}
|
|
}
|
|
|
|
private class BlockLabel
|
|
{
|
|
public readonly Operand Label;
|
|
public BrxTarget BrxTarget;
|
|
|
|
public BlockLabel(Operand label)
|
|
{
|
|
Label = label;
|
|
}
|
|
}
|
|
|
|
private readonly List<Operation> _operations;
|
|
private readonly Dictionary<ulong, BlockLabel> _labels;
|
|
|
|
public EmitterContext(DecodedProgram program, ShaderConfig config, bool isNonMain)
|
|
{
|
|
Program = program;
|
|
Config = config;
|
|
IsNonMain = isNonMain;
|
|
_operations = new List<Operation>();
|
|
_labels = new Dictionary<ulong, BlockLabel>();
|
|
|
|
EmitStart();
|
|
}
|
|
|
|
private void EmitStart()
|
|
{
|
|
if (Config.Stage == ShaderStage.Vertex &&
|
|
Config.Options.TargetApi == TargetApi.Vulkan &&
|
|
(Config.Options.Flags & TranslationFlags.VertexA) == 0)
|
|
{
|
|
// Vulkan requires the point size to be always written on the shader if the primitive topology is points.
|
|
this.Copy(Attribute(AttributeConsts.PointSize), ConstF(Config.GpuAccessor.QueryPointSize()));
|
|
}
|
|
}
|
|
|
|
public T GetOp<T>() where T : unmanaged
|
|
{
|
|
Debug.Assert(Unsafe.SizeOf<T>() == sizeof(ulong));
|
|
ulong op = CurrOp.RawOpCode;
|
|
return Unsafe.As<ulong, T>(ref op);
|
|
}
|
|
|
|
public Operand Add(Instruction inst, Operand dest = null, params Operand[] sources)
|
|
{
|
|
Operation operation = new Operation(inst, dest, sources);
|
|
|
|
_operations.Add(operation);
|
|
|
|
return dest;
|
|
}
|
|
|
|
public (Operand, Operand) Add(Instruction inst, (Operand, Operand) dest, params Operand[] sources)
|
|
{
|
|
Operand[] dests = new[] { dest.Item1, dest.Item2 };
|
|
|
|
Operation operation = new Operation(inst, 0, dests, sources);
|
|
|
|
Add(operation);
|
|
|
|
return dest;
|
|
}
|
|
|
|
public void Add(Operation operation)
|
|
{
|
|
_operations.Add(operation);
|
|
}
|
|
|
|
public TextureOperation CreateTextureOperation(
|
|
Instruction inst,
|
|
SamplerType type,
|
|
TextureFlags flags,
|
|
int handle,
|
|
int compIndex,
|
|
Operand dest,
|
|
params Operand[] sources)
|
|
{
|
|
return CreateTextureOperation(inst, type, TextureFormat.Unknown, flags, handle, compIndex, dest, sources);
|
|
}
|
|
|
|
public TextureOperation CreateTextureOperation(
|
|
Instruction inst,
|
|
SamplerType type,
|
|
TextureFormat format,
|
|
TextureFlags flags,
|
|
int handle,
|
|
int compIndex,
|
|
Operand dest,
|
|
params Operand[] sources)
|
|
{
|
|
if (!flags.HasFlag(TextureFlags.Bindless))
|
|
{
|
|
Config.SetUsedTexture(inst, type, format, flags, TextureOperation.DefaultCbufSlot, handle);
|
|
}
|
|
|
|
return new TextureOperation(inst, type, format, flags, handle, compIndex, dest, sources);
|
|
}
|
|
|
|
public void FlagAttributeRead(int attribute)
|
|
{
|
|
if (Config.Stage == ShaderStage.Vertex && attribute == AttributeConsts.InstanceId)
|
|
{
|
|
Config.SetUsedFeature(FeatureFlags.InstanceId);
|
|
}
|
|
else if (Config.Stage == ShaderStage.Fragment)
|
|
{
|
|
switch (attribute)
|
|
{
|
|
case AttributeConsts.PositionX:
|
|
case AttributeConsts.PositionY:
|
|
Config.SetUsedFeature(FeatureFlags.FragCoordXY);
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
|
|
public void FlagAttributeWritten(int attribute)
|
|
{
|
|
if (Config.Stage == ShaderStage.Vertex)
|
|
{
|
|
switch (attribute)
|
|
{
|
|
case AttributeConsts.ClipDistance0:
|
|
case AttributeConsts.ClipDistance1:
|
|
case AttributeConsts.ClipDistance2:
|
|
case AttributeConsts.ClipDistance3:
|
|
case AttributeConsts.ClipDistance4:
|
|
case AttributeConsts.ClipDistance5:
|
|
case AttributeConsts.ClipDistance6:
|
|
case AttributeConsts.ClipDistance7:
|
|
Config.SetClipDistanceWritten((attribute - AttributeConsts.ClipDistance0) / 4);
|
|
break;
|
|
}
|
|
}
|
|
|
|
if (Config.Stage != ShaderStage.Fragment && attribute == AttributeConsts.Layer)
|
|
{
|
|
Config.SetUsedFeature(FeatureFlags.RtLayer);
|
|
}
|
|
}
|
|
|
|
public void MarkLabel(Operand label)
|
|
{
|
|
Add(Instruction.MarkLabel, label);
|
|
}
|
|
|
|
public Operand GetLabel(ulong address)
|
|
{
|
|
return EnsureBlockLabel(address).Label;
|
|
}
|
|
|
|
public void SetBrxTarget(ulong address, Operand selector, int targetValue, ulong nextTargetAddress)
|
|
{
|
|
BlockLabel blockLabel = EnsureBlockLabel(address);
|
|
Debug.Assert(blockLabel.BrxTarget.Selector == null);
|
|
blockLabel.BrxTarget = new BrxTarget(selector, targetValue, nextTargetAddress);
|
|
}
|
|
|
|
public void EnterBlock(ulong address)
|
|
{
|
|
BlockLabel blockLabel = EnsureBlockLabel(address);
|
|
|
|
MarkLabel(blockLabel.Label);
|
|
|
|
BrxTarget brxTarget = blockLabel.BrxTarget;
|
|
|
|
if (brxTarget.Selector != null)
|
|
{
|
|
this.BranchIfFalse(GetLabel(brxTarget.NextTargetAddress), this.ICompareEqual(brxTarget.Selector, Const(brxTarget.ExpectedValue)));
|
|
}
|
|
}
|
|
|
|
private BlockLabel EnsureBlockLabel(ulong address)
|
|
{
|
|
if (!_labels.TryGetValue(address, out BlockLabel blockLabel))
|
|
{
|
|
blockLabel = new BlockLabel(Label());
|
|
|
|
_labels.Add(address, blockLabel);
|
|
}
|
|
|
|
return blockLabel;
|
|
}
|
|
|
|
public void PrepareForVertexReturn()
|
|
{
|
|
if (Config.GpuAccessor.QueryViewportTransformDisable())
|
|
{
|
|
Operand x = Attribute(AttributeConsts.PositionX | AttributeConsts.LoadOutputMask);
|
|
Operand y = Attribute(AttributeConsts.PositionY | AttributeConsts.LoadOutputMask);
|
|
Operand xScale = Attribute(AttributeConsts.SupportBlockViewInverseX);
|
|
Operand yScale = Attribute(AttributeConsts.SupportBlockViewInverseY);
|
|
Operand negativeOne = ConstF(-1.0f);
|
|
|
|
this.Copy(Attribute(AttributeConsts.PositionX), this.FPFusedMultiplyAdd(x, xScale, negativeOne));
|
|
this.Copy(Attribute(AttributeConsts.PositionY), this.FPFusedMultiplyAdd(y, yScale, negativeOne));
|
|
}
|
|
|
|
if (Config.Options.TargetApi == TargetApi.Vulkan && Config.GpuAccessor.QueryTransformDepthMinusOneToOne())
|
|
{
|
|
Operand z = Attribute(AttributeConsts.PositionZ | AttributeConsts.LoadOutputMask);
|
|
Operand w = Attribute(AttributeConsts.PositionW | AttributeConsts.LoadOutputMask);
|
|
Operand halfW = this.FPMultiply(w, ConstF(0.5f));
|
|
|
|
this.Copy(Attribute(AttributeConsts.PositionZ), this.FPFusedMultiplyAdd(z, ConstF(0.5f), halfW));
|
|
}
|
|
}
|
|
|
|
public void PrepareForVertexReturn(out Operand oldXLocal, out Operand oldYLocal, out Operand oldZLocal)
|
|
{
|
|
if (Config.GpuAccessor.QueryViewportTransformDisable())
|
|
{
|
|
oldXLocal = Local();
|
|
this.Copy(oldXLocal, Attribute(AttributeConsts.PositionX | AttributeConsts.LoadOutputMask));
|
|
oldYLocal = Local();
|
|
this.Copy(oldYLocal, Attribute(AttributeConsts.PositionY | AttributeConsts.LoadOutputMask));
|
|
}
|
|
else
|
|
{
|
|
oldXLocal = null;
|
|
oldYLocal = null;
|
|
}
|
|
|
|
if (Config.Options.TargetApi == TargetApi.Vulkan && Config.GpuAccessor.QueryTransformDepthMinusOneToOne())
|
|
{
|
|
oldZLocal = Local();
|
|
this.Copy(oldZLocal, Attribute(AttributeConsts.PositionZ | AttributeConsts.LoadOutputMask));
|
|
}
|
|
else
|
|
{
|
|
oldZLocal = null;
|
|
}
|
|
|
|
PrepareForVertexReturn();
|
|
}
|
|
|
|
public void PrepareForReturn()
|
|
{
|
|
if (IsNonMain)
|
|
{
|
|
return;
|
|
}
|
|
|
|
if (Config.LastInVertexPipeline &&
|
|
(Config.Stage == ShaderStage.Vertex || Config.Stage == ShaderStage.TessellationEvaluation) &&
|
|
(Config.Options.Flags & TranslationFlags.VertexA) == 0)
|
|
{
|
|
PrepareForVertexReturn();
|
|
}
|
|
else if (Config.Stage == ShaderStage.Geometry)
|
|
{
|
|
void WriteOutput(int index, int primIndex)
|
|
{
|
|
Operand x = this.LoadAttribute(Const(index), Const(0), Const(primIndex));
|
|
Operand y = this.LoadAttribute(Const(index + 4), Const(0), Const(primIndex));
|
|
Operand z = this.LoadAttribute(Const(index + 8), Const(0), Const(primIndex));
|
|
Operand w = this.LoadAttribute(Const(index + 12), Const(0), Const(primIndex));
|
|
|
|
this.Copy(Attribute(index), x);
|
|
this.Copy(Attribute(index + 4), y);
|
|
this.Copy(Attribute(index + 8), z);
|
|
this.Copy(Attribute(index + 12), w);
|
|
}
|
|
|
|
if (Config.GpPassthrough && !Config.GpuAccessor.QueryHostSupportsGeometryShaderPassthrough())
|
|
{
|
|
int inputVertices = Config.GpuAccessor.QueryPrimitiveTopology().ToInputVertices();
|
|
|
|
for (int primIndex = 0; primIndex < inputVertices; primIndex++)
|
|
{
|
|
WriteOutput(AttributeConsts.PositionX, primIndex);
|
|
|
|
int passthroughAttributes = Config.PassthroughAttributes;
|
|
while (passthroughAttributes != 0)
|
|
{
|
|
int index = BitOperations.TrailingZeroCount(passthroughAttributes);
|
|
WriteOutput(AttributeConsts.UserAttributeBase + index * 16, primIndex);
|
|
Config.SetOutputUserAttribute(index);
|
|
passthroughAttributes &= ~(1 << index);
|
|
}
|
|
|
|
this.EmitVertex();
|
|
}
|
|
|
|
this.EndPrimitive();
|
|
}
|
|
}
|
|
else if (Config.Stage == ShaderStage.Fragment)
|
|
{
|
|
GenerateAlphaToCoverageDitherDiscard();
|
|
|
|
bool supportsBgra = Config.GpuAccessor.QueryHostSupportsBgraFormat();
|
|
|
|
if (Config.OmapDepth)
|
|
{
|
|
Operand dest = Attribute(AttributeConsts.FragmentOutputDepth);
|
|
|
|
Operand src = Register(Config.GetDepthRegister(), RegisterType.Gpr);
|
|
|
|
this.Copy(dest, src);
|
|
}
|
|
|
|
AlphaTestOp alphaTestOp = Config.GpuAccessor.QueryAlphaTestCompare();
|
|
|
|
if (alphaTestOp != AlphaTestOp.Always && (Config.OmapTargets & 8) != 0)
|
|
{
|
|
if (alphaTestOp == AlphaTestOp.Never)
|
|
{
|
|
this.Discard();
|
|
}
|
|
else
|
|
{
|
|
Instruction comparator = alphaTestOp switch
|
|
{
|
|
AlphaTestOp.Equal => Instruction.CompareEqual,
|
|
AlphaTestOp.Greater => Instruction.CompareGreater,
|
|
AlphaTestOp.GreaterOrEqual => Instruction.CompareGreaterOrEqual,
|
|
AlphaTestOp.Less => Instruction.CompareLess,
|
|
AlphaTestOp.LessOrEqual => Instruction.CompareLessOrEqual,
|
|
AlphaTestOp.NotEqual => Instruction.CompareNotEqual,
|
|
_ => 0
|
|
};
|
|
|
|
Debug.Assert(comparator != 0, $"Invalid alpha test operation \"{alphaTestOp}\".");
|
|
|
|
Operand alpha = Register(3, RegisterType.Gpr);
|
|
Operand alphaRef = ConstF(Config.GpuAccessor.QueryAlphaTestReference());
|
|
Operand alphaPass = Add(Instruction.FP32 | comparator, Local(), alpha, alphaRef);
|
|
Operand alphaPassLabel = Label();
|
|
|
|
this.BranchIfTrue(alphaPassLabel, alphaPass);
|
|
this.Discard();
|
|
this.MarkLabel(alphaPassLabel);
|
|
}
|
|
}
|
|
|
|
int regIndexBase = 0;
|
|
|
|
for (int rtIndex = 0; rtIndex < 8; rtIndex++)
|
|
{
|
|
for (int component = 0; component < 4; component++)
|
|
{
|
|
bool componentEnabled = (Config.OmapTargets & (1 << (rtIndex * 4 + component))) != 0;
|
|
if (!componentEnabled)
|
|
{
|
|
continue;
|
|
}
|
|
|
|
int fragmentOutputColorAttr = AttributeConsts.FragmentOutputColorBase + rtIndex * 16;
|
|
|
|
Operand src = Register(regIndexBase + component, RegisterType.Gpr);
|
|
|
|
// Perform B <-> R swap if needed, for BGRA formats (not supported on OpenGL).
|
|
if (!supportsBgra && (component == 0 || component == 2))
|
|
{
|
|
Operand isBgra = Attribute(AttributeConsts.FragmentOutputIsBgraBase + rtIndex * 4);
|
|
|
|
Operand lblIsBgra = Label();
|
|
Operand lblEnd = Label();
|
|
|
|
this.BranchIfTrue(lblIsBgra, isBgra);
|
|
|
|
this.Copy(Attribute(fragmentOutputColorAttr + component * 4), src);
|
|
this.Branch(lblEnd);
|
|
|
|
MarkLabel(lblIsBgra);
|
|
|
|
this.Copy(Attribute(fragmentOutputColorAttr + (2 - component) * 4), src);
|
|
|
|
MarkLabel(lblEnd);
|
|
}
|
|
else
|
|
{
|
|
this.Copy(Attribute(fragmentOutputColorAttr + component * 4), src);
|
|
}
|
|
}
|
|
|
|
bool targetEnabled = (Config.OmapTargets & (0xf << (rtIndex * 4))) != 0;
|
|
if (targetEnabled)
|
|
{
|
|
Config.SetOutputUserAttribute(rtIndex);
|
|
regIndexBase += 4;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
private void GenerateAlphaToCoverageDitherDiscard()
|
|
{
|
|
// If the feature is disabled, or alpha is not written, then we're done.
|
|
if (!Config.GpuAccessor.QueryAlphaToCoverageDitherEnable() || (Config.OmapTargets & 8) == 0)
|
|
{
|
|
return;
|
|
}
|
|
|
|
// 11 11 11 10 10 10 10 00
|
|
// 11 01 01 01 01 00 00 00
|
|
Operand ditherMask = Const(unchecked((int)0xfbb99110u));
|
|
|
|
Operand x = this.BitwiseAnd(this.FP32ConvertToU32(Attribute(AttributeConsts.PositionX)), Const(1));
|
|
Operand y = this.BitwiseAnd(this.FP32ConvertToU32(Attribute(AttributeConsts.PositionY)), Const(1));
|
|
Operand xy = this.BitwiseOr(x, this.ShiftLeft(y, Const(1)));
|
|
|
|
Operand alpha = Register(3, RegisterType.Gpr);
|
|
Operand scaledAlpha = this.FPMultiply(this.FPSaturate(alpha), ConstF(8));
|
|
Operand quantizedAlpha = this.IMinimumU32(this.FP32ConvertToU32(scaledAlpha), Const(7));
|
|
Operand shift = this.BitwiseOr(this.ShiftLeft(quantizedAlpha, Const(2)), xy);
|
|
Operand opaque = this.BitwiseAnd(this.ShiftRightU32(ditherMask, shift), Const(1));
|
|
|
|
Operand a2cDitherEndLabel = Label();
|
|
|
|
this.BranchIfTrue(a2cDitherEndLabel, opaque);
|
|
this.Discard();
|
|
this.MarkLabel(a2cDitherEndLabel);
|
|
}
|
|
|
|
public Operation[] GetOperations()
|
|
{
|
|
return _operations.ToArray();
|
|
}
|
|
}
|
|
} |