mirror of
https://github.com/GreemDev/Ryujinx.git
synced 2025-01-25 08:12:01 +00:00
7f6b3d234a
* Implement IMUL shader instruction * Implement PCNT/CONT instruction and fix FFMA32I * Add HFMA232I to the table * Shader cache version bump * No Rc on Ffma32i
735 lines
No EOL
26 KiB
C#
735 lines
No EOL
26 KiB
C#
using Ryujinx.Graphics.Shader.Translation;
|
|
using System;
|
|
using System.Collections.Generic;
|
|
using System.Linq;
|
|
using System.Runtime.CompilerServices;
|
|
|
|
using static Ryujinx.Graphics.Shader.IntermediateRepresentation.OperandHelper;
|
|
|
|
namespace Ryujinx.Graphics.Shader.Decoders
|
|
{
|
|
static class Decoder
|
|
{
|
|
public static DecodedProgram Decode(ShaderConfig config, ulong startAddress)
|
|
{
|
|
Queue<DecodedFunction> functionsQueue = new Queue<DecodedFunction>();
|
|
Dictionary<ulong, DecodedFunction> functionsVisited = new Dictionary<ulong, DecodedFunction>();
|
|
|
|
DecodedFunction EnqueueFunction(ulong address)
|
|
{
|
|
if (!functionsVisited.TryGetValue(address, out DecodedFunction function))
|
|
{
|
|
functionsVisited.Add(address, function = new DecodedFunction(address));
|
|
functionsQueue.Enqueue(function);
|
|
}
|
|
|
|
return function;
|
|
}
|
|
|
|
DecodedFunction mainFunction = EnqueueFunction(0);
|
|
|
|
while (functionsQueue.TryDequeue(out DecodedFunction currentFunction))
|
|
{
|
|
List<Block> blocks = new List<Block>();
|
|
Queue<Block> workQueue = new Queue<Block>();
|
|
Dictionary<ulong, Block> visited = new Dictionary<ulong, Block>();
|
|
|
|
Block GetBlock(ulong blkAddress)
|
|
{
|
|
if (!visited.TryGetValue(blkAddress, out Block block))
|
|
{
|
|
block = new Block(blkAddress);
|
|
|
|
workQueue.Enqueue(block);
|
|
visited.Add(blkAddress, block);
|
|
}
|
|
|
|
return block;
|
|
}
|
|
|
|
GetBlock(currentFunction.Address);
|
|
|
|
bool hasNewTarget;
|
|
|
|
do
|
|
{
|
|
while (workQueue.TryDequeue(out Block currBlock))
|
|
{
|
|
// Check if the current block is inside another block.
|
|
if (BinarySearch(blocks, currBlock.Address, out int nBlkIndex))
|
|
{
|
|
Block nBlock = blocks[nBlkIndex];
|
|
|
|
if (nBlock.Address == currBlock.Address)
|
|
{
|
|
throw new InvalidOperationException("Found duplicate block address on the list.");
|
|
}
|
|
|
|
nBlock.Split(currBlock);
|
|
blocks.Insert(nBlkIndex + 1, currBlock);
|
|
|
|
continue;
|
|
}
|
|
|
|
// If we have a block after the current one, set the limit address.
|
|
ulong limitAddress = ulong.MaxValue;
|
|
|
|
if (nBlkIndex != blocks.Count)
|
|
{
|
|
Block nBlock = blocks[nBlkIndex];
|
|
|
|
int nextIndex = nBlkIndex + 1;
|
|
|
|
if (nBlock.Address < currBlock.Address && nextIndex < blocks.Count)
|
|
{
|
|
limitAddress = blocks[nextIndex].Address;
|
|
}
|
|
else if (nBlock.Address > currBlock.Address)
|
|
{
|
|
limitAddress = blocks[nBlkIndex].Address;
|
|
}
|
|
}
|
|
|
|
FillBlock(config, currBlock, limitAddress, startAddress);
|
|
|
|
if (currBlock.OpCodes.Count != 0)
|
|
{
|
|
// We should have blocks for all possible branch targets,
|
|
// including those from PBK/PCNT/SSY instructions.
|
|
foreach (PushOpInfo pushOp in currBlock.PushOpCodes)
|
|
{
|
|
GetBlock(pushOp.Op.GetAbsoluteAddress());
|
|
}
|
|
|
|
// Set child blocks. "Branch" is the block the branch instruction
|
|
// points to (when taken), "Next" is the block at the next address,
|
|
// executed when the branch is not taken. For Unconditional Branches
|
|
// or end of program, Next is null.
|
|
InstOp lastOp = currBlock.GetLastOp();
|
|
|
|
if (lastOp.Name == InstName.Cal)
|
|
{
|
|
EnqueueFunction(lastOp.GetAbsoluteAddress()).AddCaller(currentFunction);
|
|
}
|
|
else if (lastOp.Name == InstName.Bra)
|
|
{
|
|
Block succBlock = GetBlock(lastOp.GetAbsoluteAddress());
|
|
currBlock.Successors.Add(succBlock);
|
|
succBlock.Predecessors.Add(currBlock);
|
|
}
|
|
|
|
if (!IsUnconditionalBranch(ref lastOp))
|
|
{
|
|
Block succBlock = GetBlock(currBlock.EndAddress);
|
|
currBlock.Successors.Insert(0, succBlock);
|
|
succBlock.Predecessors.Add(currBlock);
|
|
}
|
|
}
|
|
|
|
// Insert the new block on the list (sorted by address).
|
|
if (blocks.Count != 0)
|
|
{
|
|
Block nBlock = blocks[nBlkIndex];
|
|
|
|
blocks.Insert(nBlkIndex + (nBlock.Address < currBlock.Address ? 1 : 0), currBlock);
|
|
}
|
|
else
|
|
{
|
|
blocks.Add(currBlock);
|
|
}
|
|
}
|
|
|
|
// Propagate SSY/PBK addresses into their uses (SYNC/BRK).
|
|
foreach (Block block in blocks.Where(x => x.PushOpCodes.Count != 0))
|
|
{
|
|
for (int pushOpIndex = 0; pushOpIndex < block.PushOpCodes.Count; pushOpIndex++)
|
|
{
|
|
PropagatePushOp(visited, block, pushOpIndex);
|
|
}
|
|
}
|
|
|
|
// Try to find targets for BRX (indirect branch) instructions.
|
|
hasNewTarget = FindBrxTargets(config, blocks, GetBlock);
|
|
|
|
// If we discovered new branch targets from the BRX instruction,
|
|
// we need another round of decoding to decode the new blocks.
|
|
// Additionally, we may have more SSY/PBK targets to propagate,
|
|
// and new BRX instructions.
|
|
}
|
|
while (hasNewTarget);
|
|
|
|
currentFunction.SetBlocks(blocks.ToArray());
|
|
}
|
|
|
|
return new DecodedProgram(mainFunction, functionsVisited);
|
|
}
|
|
|
|
private static bool BinarySearch(List<Block> blocks, ulong address, out int index)
|
|
{
|
|
index = 0;
|
|
|
|
int left = 0;
|
|
int right = blocks.Count - 1;
|
|
|
|
while (left <= right)
|
|
{
|
|
int size = right - left;
|
|
|
|
int middle = left + (size >> 1);
|
|
|
|
Block block = blocks[middle];
|
|
|
|
index = middle;
|
|
|
|
if (address >= block.Address && address < block.EndAddress)
|
|
{
|
|
return true;
|
|
}
|
|
|
|
if (address < block.Address)
|
|
{
|
|
right = middle - 1;
|
|
}
|
|
else
|
|
{
|
|
left = middle + 1;
|
|
}
|
|
}
|
|
|
|
return false;
|
|
}
|
|
|
|
private static void FillBlock(ShaderConfig config, Block block, ulong limitAddress, ulong startAddress)
|
|
{
|
|
IGpuAccessor gpuAccessor = config.GpuAccessor;
|
|
|
|
ulong address = block.Address;
|
|
int bufferOffset = 0;
|
|
ReadOnlySpan<ulong> buffer = ReadOnlySpan<ulong>.Empty;
|
|
|
|
InstOp op = default;
|
|
|
|
do
|
|
{
|
|
if (address + 7 >= limitAddress)
|
|
{
|
|
break;
|
|
}
|
|
|
|
// Ignore scheduling instructions, which are written every 32 bytes.
|
|
if ((address & 0x1f) == 0)
|
|
{
|
|
address += 8;
|
|
bufferOffset++;
|
|
continue;
|
|
}
|
|
|
|
if (bufferOffset >= buffer.Length)
|
|
{
|
|
buffer = gpuAccessor.GetCode(startAddress + address, 8);
|
|
bufferOffset = 0;
|
|
}
|
|
|
|
ulong opCode = buffer[bufferOffset++];
|
|
|
|
op = InstTable.GetOp(address, opCode);
|
|
|
|
if (op.Props.HasFlag(InstProps.TexB))
|
|
{
|
|
config.SetUsedFeature(FeatureFlags.Bindless);
|
|
}
|
|
|
|
if (op.Name == InstName.Ald || op.Name == InstName.Ast || op.Name == InstName.Ipa)
|
|
{
|
|
SetUserAttributeUses(config, op.Name, opCode);
|
|
}
|
|
else if (op.Name == InstName.Pbk || op.Name == InstName.Pcnt || op.Name == InstName.Ssy)
|
|
{
|
|
block.AddPushOp(op);
|
|
}
|
|
|
|
block.OpCodes.Add(op);
|
|
|
|
address += 8;
|
|
}
|
|
while (!op.Props.HasFlag(InstProps.Bra));
|
|
|
|
block.EndAddress = address;
|
|
}
|
|
|
|
private static void SetUserAttributeUses(ShaderConfig config, InstName name, ulong opCode)
|
|
{
|
|
int offset;
|
|
int count = 1;
|
|
bool isStore = false;
|
|
bool indexed = false;
|
|
bool perPatch = false;
|
|
|
|
if (name == InstName.Ast)
|
|
{
|
|
InstAst opAst = new InstAst(opCode);
|
|
count = (int)opAst.AlSize + 1;
|
|
offset = opAst.Imm11;
|
|
indexed = opAst.Phys;
|
|
perPatch = opAst.P;
|
|
isStore = true;
|
|
}
|
|
else if (name == InstName.Ald)
|
|
{
|
|
InstAld opAld = new InstAld(opCode);
|
|
count = (int)opAld.AlSize + 1;
|
|
offset = opAld.Imm11;
|
|
indexed = opAld.Phys;
|
|
perPatch = opAld.P;
|
|
isStore = opAld.O;
|
|
}
|
|
else /* if (name == InstName.Ipa) */
|
|
{
|
|
InstIpa opIpa = new InstIpa(opCode);
|
|
offset = opIpa.Imm10;
|
|
indexed = opIpa.Idx;
|
|
}
|
|
|
|
if (indexed)
|
|
{
|
|
if (isStore)
|
|
{
|
|
config.SetAllOutputUserAttributes();
|
|
}
|
|
else
|
|
{
|
|
config.SetAllInputUserAttributes();
|
|
}
|
|
}
|
|
else
|
|
{
|
|
for (int elemIndex = 0; elemIndex < count; elemIndex++)
|
|
{
|
|
int attr = offset + elemIndex * 4;
|
|
if (attr >= AttributeConsts.UserAttributeBase && attr < AttributeConsts.UserAttributeEnd)
|
|
{
|
|
int index = (attr - AttributeConsts.UserAttributeBase) / 16;
|
|
|
|
if (isStore)
|
|
{
|
|
config.SetOutputUserAttribute(index, perPatch);
|
|
}
|
|
else
|
|
{
|
|
config.SetInputUserAttribute(index, perPatch);
|
|
}
|
|
}
|
|
|
|
if (!isStore &&
|
|
((attr >= AttributeConsts.FrontColorDiffuseR && attr < AttributeConsts.ClipDistance0) ||
|
|
(attr >= AttributeConsts.TexCoordBase && attr < AttributeConsts.TexCoordEnd)))
|
|
{
|
|
config.SetUsedFeature(FeatureFlags.FixedFuncAttr);
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
public static bool IsUnconditionalBranch(ref InstOp op)
|
|
{
|
|
return IsUnconditional(ref op) && op.Props.HasFlag(InstProps.Bra);
|
|
}
|
|
|
|
private static bool IsUnconditional(ref InstOp op)
|
|
{
|
|
InstConditional condOp = new InstConditional(op.RawOpCode);
|
|
|
|
if (op.Name == InstName.Exit && condOp.Ccc != Ccc.T)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
return condOp.Pred == RegisterConsts.PredicateTrueIndex && !condOp.PredInv;
|
|
}
|
|
|
|
private static bool FindBrxTargets(ShaderConfig config, IEnumerable<Block> blocks, Func<ulong, Block> getBlock)
|
|
{
|
|
bool hasNewTarget = false;
|
|
|
|
foreach (Block block in blocks)
|
|
{
|
|
InstOp lastOp = block.GetLastOp();
|
|
bool hasNext = block.HasNext();
|
|
|
|
if (lastOp.Name == InstName.Brx && block.Successors.Count == (hasNext ? 1 : 0))
|
|
{
|
|
InstBrx opBrx = new InstBrx(lastOp.RawOpCode);
|
|
ulong baseOffset = lastOp.GetAbsoluteAddress();
|
|
|
|
// An indirect branch could go anywhere,
|
|
// try to get the possible target offsets from the constant buffer.
|
|
(int cbBaseOffset, int cbOffsetsCount) = FindBrxTargetRange(block, opBrx.SrcA);
|
|
|
|
if (cbOffsetsCount != 0)
|
|
{
|
|
hasNewTarget = true;
|
|
}
|
|
|
|
for (int i = 0; i < cbOffsetsCount; i++)
|
|
{
|
|
uint targetOffset = config.GpuAccessor.ConstantBuffer1Read(cbBaseOffset + i * 4);
|
|
Block target = getBlock(baseOffset + targetOffset);
|
|
target.Predecessors.Add(block);
|
|
block.Successors.Add(target);
|
|
}
|
|
}
|
|
}
|
|
|
|
return hasNewTarget;
|
|
}
|
|
|
|
private static (int, int) FindBrxTargetRange(Block block, int brxReg)
|
|
{
|
|
// Try to match the following pattern:
|
|
//
|
|
// IMNMX.U32 Rx, Rx, UpperBound, PT
|
|
// SHL Rx, Rx, 0x2
|
|
// LDC Rx, c[0x1][Rx+BaseOffset]
|
|
//
|
|
// Here, Rx is an arbitrary register, "UpperBound" and "BaseOffset" are constants.
|
|
// The above pattern is assumed to be generated by the compiler before BRX,
|
|
// as the instruction is usually used to implement jump tables for switch statement optimizations.
|
|
// On a successful match, "BaseOffset" is the offset in bytes where the jump offsets are
|
|
// located on the constant buffer, and "UpperBound" is the total number of offsets for the BRX, minus 1.
|
|
|
|
HashSet<Block> visited = new HashSet<Block>();
|
|
|
|
var ldcLocation = FindFirstRegWrite(visited, new BlockLocation(block, block.OpCodes.Count - 1), brxReg);
|
|
if (ldcLocation.Block == null || ldcLocation.Block.OpCodes[ldcLocation.Index].Name != InstName.Ldc)
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
GetOp<InstLdc>(ldcLocation, out var opLdc);
|
|
|
|
if (opLdc.CbufSlot != 1 || opLdc.AddressMode != 0)
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
var shlLocation = FindFirstRegWrite(visited, ldcLocation, opLdc.SrcA);
|
|
if (shlLocation.Block == null || !shlLocation.IsImmInst(InstName.Shl))
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
GetOp<InstShlI>(shlLocation, out var opShl);
|
|
|
|
if (opShl.Imm20 != 2)
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
var imnmxLocation = FindFirstRegWrite(visited, shlLocation, opShl.SrcA);
|
|
if (imnmxLocation.Block == null || !imnmxLocation.IsImmInst(InstName.Imnmx))
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
GetOp<InstImnmxI>(imnmxLocation, out var opImnmx);
|
|
|
|
if (opImnmx.Signed || opImnmx.SrcPred != RegisterConsts.PredicateTrueIndex || opImnmx.SrcPredInv)
|
|
{
|
|
return (0, 0);
|
|
}
|
|
|
|
return (opLdc.CbufOffset, opImnmx.Imm20 + 1);
|
|
}
|
|
|
|
private static void GetOp<T>(BlockLocation location, out T op) where T : unmanaged
|
|
{
|
|
ulong rawOp = location.Block.OpCodes[location.Index].RawOpCode;
|
|
op = Unsafe.As<ulong, T>(ref rawOp);
|
|
}
|
|
|
|
private struct BlockLocation
|
|
{
|
|
public Block Block { get; }
|
|
public int Index { get; }
|
|
|
|
public BlockLocation(Block block, int index)
|
|
{
|
|
Block = block;
|
|
Index = index;
|
|
}
|
|
|
|
public bool IsImmInst(InstName name)
|
|
{
|
|
InstOp op = Block.OpCodes[Index];
|
|
return op.Name == name && op.Props.HasFlag(InstProps.Ib);
|
|
}
|
|
}
|
|
|
|
private static BlockLocation FindFirstRegWrite(HashSet<Block> visited, BlockLocation location, int regIndex)
|
|
{
|
|
Queue<BlockLocation> toVisit = new Queue<BlockLocation>();
|
|
toVisit.Enqueue(location);
|
|
visited.Add(location.Block);
|
|
|
|
while (toVisit.TryDequeue(out var currentLocation))
|
|
{
|
|
Block block = currentLocation.Block;
|
|
for (int i = currentLocation.Index - 1; i >= 0; i--)
|
|
{
|
|
if (WritesToRegister(block.OpCodes[i], regIndex))
|
|
{
|
|
return new BlockLocation(block, i);
|
|
}
|
|
}
|
|
|
|
foreach (Block predecessor in block.Predecessors)
|
|
{
|
|
if (visited.Add(predecessor))
|
|
{
|
|
toVisit.Enqueue(new BlockLocation(predecessor, predecessor.OpCodes.Count));
|
|
}
|
|
}
|
|
}
|
|
|
|
return new BlockLocation(null, 0);
|
|
}
|
|
|
|
private static bool WritesToRegister(InstOp op, int regIndex)
|
|
{
|
|
// Predicate instruction only ever writes to predicate, so we shouldn't check those.
|
|
if ((op.Props & (InstProps.Rd | InstProps.Rd2)) == 0)
|
|
{
|
|
return false;
|
|
}
|
|
|
|
if (op.Props.HasFlag(InstProps.Rd2) && (byte)(op.RawOpCode >> 28) == regIndex)
|
|
{
|
|
return true;
|
|
}
|
|
|
|
return (byte)op.RawOpCode == regIndex;
|
|
}
|
|
|
|
private enum MergeType
|
|
{
|
|
Brk,
|
|
Cont,
|
|
Sync
|
|
}
|
|
|
|
private struct PathBlockState
|
|
{
|
|
public Block Block { get; }
|
|
|
|
private enum RestoreType
|
|
{
|
|
None,
|
|
PopPushOp,
|
|
PushBranchOp
|
|
}
|
|
|
|
private RestoreType _restoreType;
|
|
|
|
private ulong _restoreValue;
|
|
private MergeType _restoreMergeType;
|
|
|
|
public bool ReturningFromVisit => _restoreType != RestoreType.None;
|
|
|
|
public PathBlockState(Block block)
|
|
{
|
|
Block = block;
|
|
_restoreType = RestoreType.None;
|
|
_restoreValue = 0;
|
|
_restoreMergeType = default;
|
|
}
|
|
|
|
public PathBlockState(int oldStackSize)
|
|
{
|
|
Block = null;
|
|
_restoreType = RestoreType.PopPushOp;
|
|
_restoreValue = (ulong)oldStackSize;
|
|
_restoreMergeType = default;
|
|
}
|
|
|
|
public PathBlockState(ulong syncAddress, MergeType mergeType)
|
|
{
|
|
Block = null;
|
|
_restoreType = RestoreType.PushBranchOp;
|
|
_restoreValue = syncAddress;
|
|
_restoreMergeType = mergeType;
|
|
}
|
|
|
|
public void RestoreStackState(Stack<(ulong, MergeType)> branchStack)
|
|
{
|
|
if (_restoreType == RestoreType.PushBranchOp)
|
|
{
|
|
branchStack.Push((_restoreValue, _restoreMergeType));
|
|
}
|
|
else if (_restoreType == RestoreType.PopPushOp)
|
|
{
|
|
while (branchStack.Count > (uint)_restoreValue)
|
|
{
|
|
branchStack.Pop();
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
private static void PropagatePushOp(Dictionary<ulong, Block> blocks, Block currBlock, int pushOpIndex)
|
|
{
|
|
PushOpInfo pushOpInfo = currBlock.PushOpCodes[pushOpIndex];
|
|
InstOp pushOp = pushOpInfo.Op;
|
|
|
|
Block target = blocks[pushOp.GetAbsoluteAddress()];
|
|
|
|
Stack<PathBlockState> workQueue = new Stack<PathBlockState>();
|
|
HashSet<Block> visited = new HashSet<Block>();
|
|
Stack<(ulong, MergeType)> branchStack = new Stack<(ulong, MergeType)>();
|
|
|
|
void Push(PathBlockState pbs)
|
|
{
|
|
// When block is null, this means we are pushing a restore operation.
|
|
// Restore operations are used to undo the work done inside a block
|
|
// when we return from it, for example it pops addresses pushed by
|
|
// SSY/PBK instructions inside the block, and pushes addresses poped
|
|
// by SYNC/BRK.
|
|
// For blocks, if it's already visited, we just ignore to avoid going
|
|
// around in circles and getting stuck here.
|
|
if (pbs.Block == null || !visited.Contains(pbs.Block))
|
|
{
|
|
workQueue.Push(pbs);
|
|
}
|
|
}
|
|
|
|
Push(new PathBlockState(currBlock));
|
|
|
|
while (workQueue.TryPop(out PathBlockState pbs))
|
|
{
|
|
if (pbs.ReturningFromVisit)
|
|
{
|
|
pbs.RestoreStackState(branchStack);
|
|
|
|
continue;
|
|
}
|
|
|
|
Block current = pbs.Block;
|
|
|
|
// If the block was already processed, we just ignore it, otherwise
|
|
// we would push the same child blocks of an already processed block,
|
|
// and go around in circles until memory is exhausted.
|
|
if (!visited.Add(current))
|
|
{
|
|
continue;
|
|
}
|
|
|
|
int pushOpsCount = current.PushOpCodes.Count;
|
|
if (pushOpsCount != 0)
|
|
{
|
|
Push(new PathBlockState(branchStack.Count));
|
|
|
|
for (int index = pushOpIndex; index < pushOpsCount; index++)
|
|
{
|
|
InstOp currentPushOp = current.PushOpCodes[index].Op;
|
|
MergeType pushMergeType = GetMergeTypeFromPush(currentPushOp.Name);
|
|
branchStack.Push((currentPushOp.GetAbsoluteAddress(), pushMergeType));
|
|
}
|
|
}
|
|
|
|
pushOpIndex = 0;
|
|
|
|
bool hasNext = current.HasNext();
|
|
if (hasNext)
|
|
{
|
|
Push(new PathBlockState(current.Successors[0]));
|
|
}
|
|
|
|
InstOp lastOp = current.GetLastOp();
|
|
if (IsPopBranch(lastOp.Name))
|
|
{
|
|
MergeType popMergeType = GetMergeTypeFromPop(lastOp.Name);
|
|
|
|
bool found = true;
|
|
ulong targetAddress = 0UL;
|
|
MergeType mergeType;
|
|
|
|
do
|
|
{
|
|
if (branchStack.Count == 0)
|
|
{
|
|
found = false;
|
|
break;
|
|
}
|
|
|
|
(targetAddress, mergeType) = branchStack.Pop();
|
|
|
|
// Push the target address (this will be used to push the address
|
|
// back into the PBK/PCNT/SSY stack when we return from that block),
|
|
Push(new PathBlockState(targetAddress, mergeType));
|
|
}
|
|
while (mergeType != popMergeType);
|
|
|
|
// Make sure we found the correct address,
|
|
// the push and pop instruction types must match, so:
|
|
// - BRK can only consume addresses pushed by PBK.
|
|
// - SYNC can only consume addresses pushed by SSY.
|
|
if (found)
|
|
{
|
|
if (branchStack.Count == 0)
|
|
{
|
|
// If the entire stack was consumed, then the current pop instruction
|
|
// just consumed the address from our push instruction.
|
|
if (current.SyncTargets.TryAdd(pushOp.Address, new SyncTarget(pushOpInfo, current.SyncTargets.Count)))
|
|
{
|
|
pushOpInfo.Consumers.Add(current, Local());
|
|
target.Predecessors.Add(current);
|
|
current.Successors.Add(target);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// Push the block itself into the work queue for processing.
|
|
Push(new PathBlockState(blocks[targetAddress]));
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// By adding them in descending order (sorted by address), we process the blocks
|
|
// in order (of ascending address), since we work with a LIFO.
|
|
foreach (Block possibleTarget in current.Successors.OrderByDescending(x => x.Address))
|
|
{
|
|
if (!hasNext || possibleTarget != current.Successors[0])
|
|
{
|
|
Push(new PathBlockState(possibleTarget));
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
public static bool IsPopBranch(InstName name)
|
|
{
|
|
return name == InstName.Brk || name == InstName.Cont || name == InstName.Sync;
|
|
}
|
|
|
|
private static MergeType GetMergeTypeFromPush(InstName name)
|
|
{
|
|
return name switch
|
|
{
|
|
InstName.Pbk => MergeType.Brk,
|
|
InstName.Pcnt => MergeType.Cont,
|
|
_ => MergeType.Sync
|
|
};
|
|
}
|
|
|
|
private static MergeType GetMergeTypeFromPop(InstName name)
|
|
{
|
|
return name switch
|
|
{
|
|
InstName.Brk => MergeType.Brk,
|
|
InstName.Cont => MergeType.Cont,
|
|
_ => MergeType.Sync
|
|
};
|
|
}
|
|
}
|
|
} |