mirror of https://github.com/icsharpcode/ILSpy.git
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
511 lines
17 KiB
511 lines
17 KiB
using System; |
|
using System.Collections.Generic; |
|
using System.Linq; |
|
using ICSharpCode.Decompiler.FlowAnalysis; |
|
using Mono.Cecil; |
|
using Mono.Cecil.Cil; |
|
using Decompiler.Rocks; |
|
|
|
namespace Decompiler.ControlFlow |
|
{ |
|
public class ILAstOptimizer |
|
{ |
|
Dictionary<ILLabel, ControlFlowNode> labelToCfNode = new Dictionary<ILLabel, ControlFlowNode>(); |
|
|
|
public void Optimize(ILBlock method) |
|
{ |
|
foreach(ILBlock block in method.GetSelfAndChildrenRecursive<ILBlock>().ToList()) { |
|
SplitToMovableBlocks(block); |
|
} |
|
|
|
foreach(ILBlock block in method.GetSelfAndChildrenRecursive<ILBlock>().Where(b => !(b is ILMoveableBlock)).ToList()) { |
|
ControlFlowGraph graph; |
|
graph = BuildGraph(block.Body, block.EntryPoint); |
|
graph.ComputeDominance(); |
|
graph.ComputeDominanceFrontier(); |
|
block.Body = FindLoops(new HashSet<ControlFlowNode>(graph.Nodes.Skip(3)), graph.EntryPoint, true); |
|
} |
|
|
|
foreach(ILBlock block in method.GetSelfAndChildrenRecursive<ILBlock>().Where(b => !(b is ILMoveableBlock)).ToList()) { |
|
ControlFlowGraph graph; |
|
graph = BuildGraph(block.Body, block.EntryPoint); |
|
graph.ComputeDominance(); |
|
graph.ComputeDominanceFrontier(); |
|
block.Body = FindConditions(new HashSet<ControlFlowNode>(graph.Nodes.Skip(3)), graph.EntryPoint); |
|
} |
|
|
|
// OrderNodes(method); |
|
FlattenNestedMovableBlocks(method); |
|
SimpleGotoRemoval(method); |
|
RemoveDeadLabels(method); |
|
} |
|
|
|
class ILMoveableBlock: ILBlock |
|
{ |
|
public int OriginalOrder; |
|
} |
|
|
|
int nextBlockIndex = 0; |
|
|
|
/// <summary> |
|
/// Group input into a set of blocks that can be later arbitraliby schufled. |
|
/// The method adds necessary branches to make control flow between blocks |
|
/// explicit and thus order independent. |
|
/// </summary> |
|
void SplitToMovableBlocks(ILBlock block) |
|
{ |
|
// Remve no-ops |
|
// TODO: Assign the no-op range to someting |
|
block.Body = block.Body.Where(n => !(n is ILExpression && ((ILExpression)n).OpCode == OpCodes.Nop)).ToList(); |
|
|
|
List<ILNode> moveableBlocks = new List<ILNode>(); |
|
|
|
ILMoveableBlock moveableBlock = new ILMoveableBlock() { OriginalOrder = (nextBlockIndex++) }; |
|
moveableBlocks.Add(moveableBlock); |
|
block.EntryPoint = new ILLabel() { Name = "Block_" + moveableBlock.OriginalOrder }; |
|
moveableBlock.Body.Add(block.EntryPoint); |
|
|
|
if (block.Body.Count > 0) { |
|
moveableBlock.Body.Add(block.Body[0]); |
|
|
|
for (int i = 1; i < block.Body.Count; i++) { |
|
ILNode lastNode = block.Body[i - 1]; |
|
ILNode currNode = block.Body[i]; |
|
|
|
// Insert split |
|
if ((currNode is ILLabel && !(lastNode is ILLabel)) || |
|
lastNode is ILTryCatchBlock || |
|
currNode is ILTryCatchBlock || |
|
(lastNode is ILExpression) && ((ILExpression)lastNode).OpCode.IsBranch() || |
|
(currNode is ILExpression) && ((ILExpression)currNode).OpCode.IsBranch()) |
|
{ |
|
ILBlock lastBlock = moveableBlock; |
|
moveableBlock = new ILMoveableBlock() { OriginalOrder = (nextBlockIndex++) }; |
|
moveableBlocks.Add(moveableBlock); |
|
|
|
// Explicit branch from one block to other |
|
// (unless the last expression was unconditional branch) |
|
if (!(lastNode is ILExpression) || ((ILExpression)lastNode).OpCode.CanFallThough()) { |
|
ILLabel blockLabel = new ILLabel() { Name = "Block_" + moveableBlock.OriginalOrder }; |
|
lastBlock.Body.Add(new ILExpression(OpCodes.Br, blockLabel)); |
|
moveableBlock.Body.Add(blockLabel); |
|
} |
|
} |
|
|
|
moveableBlock.Body.Add(currNode); |
|
} |
|
} |
|
|
|
block.Body = moveableBlocks; |
|
return; |
|
} |
|
|
|
ControlFlowGraph BuildGraph(List<ILNode> nodes, ILLabel entryLabel) |
|
{ |
|
int index = 0; |
|
List<ControlFlowNode> cfNodes = new List<ControlFlowNode>(); |
|
ControlFlowNode entryPoint = new ControlFlowNode(index++, 0, ControlFlowNodeType.EntryPoint); |
|
cfNodes.Add(entryPoint); |
|
ControlFlowNode regularExit = new ControlFlowNode(index++, -1, ControlFlowNodeType.RegularExit); |
|
cfNodes.Add(regularExit); |
|
ControlFlowNode exceptionalExit = new ControlFlowNode(index++, -1, ControlFlowNodeType.ExceptionalExit); |
|
cfNodes.Add(exceptionalExit); |
|
|
|
// Create graph nodes |
|
labelToCfNode = new Dictionary<ILLabel, ControlFlowNode>(); |
|
Dictionary<ILNode, ControlFlowNode> astNodeToCfNode = new Dictionary<ILNode, ControlFlowNode>(); |
|
foreach(ILNode node in nodes) { |
|
ControlFlowNode cfNode = new ControlFlowNode(index++, -1, ControlFlowNodeType.Normal); |
|
cfNodes.Add(cfNode); |
|
astNodeToCfNode[node] = cfNode; |
|
cfNode.UserData = node; |
|
|
|
// Find all contained labels |
|
foreach(ILLabel label in node.GetSelfAndChildrenRecursive<ILLabel>()) { |
|
labelToCfNode[label] = cfNode; |
|
} |
|
} |
|
|
|
// Entry endge |
|
ControlFlowNode entryNode = labelToCfNode[entryLabel]; |
|
ControlFlowEdge entryEdge = new ControlFlowEdge(entryPoint, entryNode, JumpType.Normal); |
|
entryPoint.Outgoing.Add(entryEdge); |
|
entryNode.Incoming.Add(entryEdge); |
|
|
|
// Create edges |
|
foreach(ILNode node in nodes) { |
|
ControlFlowNode source = astNodeToCfNode[node]; |
|
|
|
// Find all branches |
|
foreach(ILExpression child in node.GetSelfAndChildrenRecursive<ILExpression>()) { |
|
IEnumerable<ILLabel> targets = child.GetBranchTargets(); |
|
if (targets != null) { |
|
foreach(ILLabel target in targets) { |
|
ControlFlowNode destination; |
|
// Labels which are out of out scope will not be int the collection |
|
if (labelToCfNode.TryGetValue(target, out destination) && destination != source) { |
|
ControlFlowEdge edge = new ControlFlowEdge(source, destination, JumpType.Normal); |
|
source.Outgoing.Add(edge); |
|
destination.Incoming.Add(edge); |
|
} |
|
} |
|
} |
|
} |
|
} |
|
|
|
return new ControlFlowGraph(cfNodes.ToArray()); |
|
} |
|
|
|
List<ILNode> FindLoops(HashSet<ControlFlowNode> nodes, ControlFlowNode entryPoint, bool excludeEntryPoint) |
|
{ |
|
List<ILNode> result = new List<ILNode>(); |
|
|
|
Queue<ControlFlowNode> agenda = new Queue<ControlFlowNode>(); |
|
agenda.Enqueue(entryPoint); |
|
while(agenda.Count > 0) { |
|
ControlFlowNode node = agenda.Dequeue(); |
|
|
|
if (nodes.Contains(node) |
|
&& node.DominanceFrontier.Contains(node) |
|
&& (node != entryPoint || !excludeEntryPoint)) |
|
{ |
|
HashSet<ControlFlowNode> loopContents = new HashSet<ControlFlowNode>(); |
|
FindLoopContents(nodes, loopContents, node, node); |
|
|
|
// Move the content into loop block |
|
nodes.ExceptWith(loopContents); |
|
ILLabel entryLabel = new ILLabel() { Name = "Loop_" + (nextBlockIndex++) }; |
|
((ILBlock)node.UserData).Body.Insert(0, entryLabel); |
|
result.Add(new ILLoop() { ContentBlock = new ILBlock(FindLoops(loopContents, node, true)) { EntryPoint = entryLabel } }); |
|
} |
|
|
|
// Using the dominator tree should ensure we find the the widest loop first |
|
foreach(var child in node.DominatorTreeChildren) { |
|
agenda.Enqueue(child); |
|
} |
|
} |
|
|
|
// Add whatever is left |
|
foreach(var node in nodes) { |
|
result.Add((ILNode)node.UserData); |
|
} |
|
|
|
return result; |
|
} |
|
|
|
static void FindLoopContents(HashSet<ControlFlowNode> nodes, HashSet<ControlFlowNode> loopContents, ControlFlowNode loopHead, ControlFlowNode addNode) |
|
{ |
|
if (nodes.Contains(addNode) && loopHead.Dominates(addNode) && loopContents.Add(addNode)) { |
|
foreach (var edge in addNode.Incoming) { |
|
FindLoopContents(nodes, loopContents, loopHead, edge.Source); |
|
} |
|
} |
|
} |
|
|
|
List<ILNode> FindConditions(HashSet<ControlFlowNode> nodes, ControlFlowNode entryNode) |
|
{ |
|
List<ILNode> result = new List<ILNode>(); |
|
|
|
Queue<ControlFlowNode> agenda = new Queue<ControlFlowNode>(); |
|
agenda.Enqueue(entryNode); |
|
while(agenda.Count > 0) { |
|
ControlFlowNode node = agenda.Dequeue(); |
|
|
|
// Find a block that represents a simple condition |
|
if (nodes.Contains(node)) { |
|
|
|
ILMoveableBlock block = node.UserData as ILMoveableBlock; |
|
|
|
if (block != null && block.Body.Count == 3) { |
|
|
|
ILLabel label = block.Body[0] as ILLabel; |
|
ILExpression condBranch = block.Body[1] as ILExpression; |
|
ILExpression statBranch = block.Body[2] as ILExpression; |
|
|
|
// Switch |
|
if (label != null && |
|
condBranch != null && condBranch.Operand is ILLabel[] && condBranch.Arguments.Count > 0 && |
|
statBranch != null && statBranch.Operand is ILLabel && statBranch.Arguments.Count == 0) |
|
{ |
|
ILSwitch ilSwitch = new ILSwitch() { Condition = condBranch }; |
|
|
|
// Replace the two branches with a conditional structure - this preserves the node label |
|
block.Body.Remove(condBranch); |
|
block.Body.Remove(statBranch); |
|
block.Body.Add(ilSwitch); |
|
|
|
ControlFlowNode statTarget = null; |
|
labelToCfNode.TryGetValue((ILLabel)statBranch.Operand, out statTarget); |
|
|
|
// Pull in the conditional code |
|
HashSet<ControlFlowNode> frontiers = new HashSet<ControlFlowNode>(); |
|
|
|
if (statTarget != null) |
|
frontiers.UnionWith(statTarget.DominanceFrontier); |
|
|
|
foreach(ILLabel condLabel in (ILLabel[])condBranch.Operand) { |
|
ControlFlowNode condTarget = null; |
|
labelToCfNode.TryGetValue(condLabel, out condTarget); |
|
|
|
if (condTarget != null) |
|
frontiers.UnionWith(condTarget.DominanceFrontier); |
|
} |
|
|
|
foreach(ILLabel condLabel in (ILLabel[])condBranch.Operand) { |
|
ControlFlowNode condTarget = null; |
|
labelToCfNode.TryGetValue(condLabel, out condTarget); |
|
|
|
ILBlock caseBlock = new ILBlock() { EntryPoint = condLabel }; |
|
if (condTarget != null && !frontiers.Contains(condTarget)) { |
|
HashSet<ControlFlowNode> content = FindDominatedNodes(nodes, condTarget); |
|
nodes.ExceptWith(content); |
|
caseBlock.Body.AddRange(FindConditions(content, condTarget)); |
|
} |
|
ilSwitch.CaseBlocks.Add(caseBlock); |
|
} |
|
|
|
// The labels will not be used - kill them |
|
condBranch.Operand = null; |
|
|
|
result.Add(block); |
|
nodes.Remove(node); |
|
} |
|
|
|
// Two-way branch |
|
if (label != null && |
|
condBranch != null && condBranch.Operand is ILLabel && condBranch.Arguments.Count > 0 && |
|
statBranch != null && statBranch.Operand is ILLabel && statBranch.Arguments.Count == 0) |
|
{ |
|
ControlFlowNode statTarget = null; |
|
labelToCfNode.TryGetValue((ILLabel)statBranch.Operand, out statTarget); |
|
ControlFlowNode condTarget = null; |
|
labelToCfNode.TryGetValue((ILLabel)condBranch.Operand, out condTarget); |
|
|
|
ILCondition condition = new ILCondition() { |
|
Condition = condBranch, |
|
TrueBlock = new ILBlock() { EntryPoint = (ILLabel)condBranch.Operand }, |
|
FalseBlock = new ILBlock() { EntryPoint = (ILLabel)statBranch.Operand } |
|
}; |
|
|
|
// Replace the two branches with a conditional structure - this preserves the node label |
|
block.Body.Remove(condBranch); |
|
block.Body.Remove(statBranch); |
|
block.Body.Add(condition); |
|
|
|
// Pull in the conditional code |
|
HashSet<ControlFlowNode> frontiers = new HashSet<ControlFlowNode>(); |
|
if (statTarget != null) |
|
frontiers.UnionWith(statTarget.DominanceFrontier); |
|
if (condTarget != null) |
|
frontiers.UnionWith(condTarget.DominanceFrontier); |
|
|
|
if (condTarget != null && !frontiers.Contains(condTarget)) { |
|
HashSet<ControlFlowNode> content = FindDominatedNodes(nodes, condTarget); |
|
nodes.ExceptWith(content); |
|
condition.TrueBlock.Body.AddRange(FindConditions(content, condTarget)); |
|
} |
|
if (statTarget != null && !frontiers.Contains(statTarget)) { |
|
HashSet<ControlFlowNode> content = FindDominatedNodes(nodes, statTarget); |
|
nodes.ExceptWith(content); |
|
condition.FalseBlock.Body.AddRange(FindConditions(content, statTarget)); |
|
} |
|
|
|
// The label will not be used - kill it |
|
condBranch.Operand = null; |
|
|
|
result.Add(block); |
|
nodes.Remove(node); |
|
} |
|
} |
|
|
|
// Add the node now so that we have good ordering |
|
if (nodes.Contains(node)) { |
|
result.Add((ILNode)node.UserData); |
|
nodes.Remove(node); |
|
} |
|
} |
|
|
|
// Using the dominator tree should ensure we find the the widest loop first |
|
foreach(var child in node.DominatorTreeChildren) { |
|
agenda.Enqueue(child); |
|
} |
|
} |
|
|
|
// Add whatever is left |
|
foreach(var node in nodes) { |
|
result.Add((ILNode)node.UserData); |
|
} |
|
|
|
return result; |
|
} |
|
|
|
static HashSet<ControlFlowNode> FindDominatedNodes(HashSet<ControlFlowNode> nodes, ControlFlowNode head) |
|
{ |
|
var exitNodes = head.DominanceFrontier.SelectMany(n => n.Predecessors); |
|
HashSet<ControlFlowNode> agenda = new HashSet<ControlFlowNode>(exitNodes); |
|
HashSet<ControlFlowNode> result = new HashSet<ControlFlowNode>(); |
|
|
|
while(agenda.Count > 0) { |
|
ControlFlowNode addNode = agenda.First(); |
|
agenda.Remove(addNode); |
|
|
|
if (nodes.Contains(addNode) && head.Dominates(addNode) && result.Add(addNode)) { |
|
foreach (var predecessor in addNode.Predecessors) { |
|
agenda.Add(predecessor); |
|
} |
|
} |
|
} |
|
if (nodes.Contains(head)) |
|
result.Add(head); |
|
|
|
return result; |
|
} |
|
|
|
/* |
|
|
|
public enum ShortCircuitOperator |
|
{ |
|
LeftAndRight, |
|
LeftOrRight, |
|
NotLeftAndRight, |
|
NotLeftOrRight, |
|
} |
|
|
|
static bool TryOptimizeShortCircuit(Node head) |
|
{ |
|
if ((head is BasicBlock) && |
|
(head as BasicBlock).BranchBasicBlock != null && |
|
(head as BasicBlock).FallThroughBasicBlock != null) { |
|
head.Parent.MergeChilds<SimpleBranch>(head); |
|
return true; |
|
} |
|
|
|
Branch top = head as Branch; |
|
if (top == null) return false; |
|
|
|
Branch left = head.FloatUpToNeighbours(top.TrueSuccessor) as Branch; |
|
Branch right = head.FloatUpToNeighbours(top.FalseSuccessor) as Branch; |
|
|
|
// A & B |
|
if (left != null && |
|
left.Predecessors.Count == 1 && |
|
left.FalseSuccessor == top.FalseSuccessor) { |
|
ShortCircuitBranch scBranch = top.Parent.MergeChilds<ShortCircuitBranch>(top, left); |
|
scBranch.Operator = ShortCircuitOperator.LeftAndRight; |
|
return true; |
|
} |
|
|
|
// ~A | B |
|
if (left != null && |
|
left.Predecessors.Count == 1 && |
|
left.TrueSuccessor == top.FalseSuccessor) { |
|
ShortCircuitBranch scBranch = top.Parent.MergeChilds<ShortCircuitBranch>(top, left); |
|
scBranch.Operator = ShortCircuitOperator.NotLeftOrRight; |
|
return true; |
|
} |
|
|
|
// A | B |
|
if (right != null && |
|
right.Predecessors.Count == 1 && |
|
right.TrueSuccessor == top.TrueSuccessor) { |
|
ShortCircuitBranch scBranch = top.Parent.MergeChilds<ShortCircuitBranch>(top, right); |
|
scBranch.Operator = ShortCircuitOperator.LeftOrRight; |
|
return true; |
|
} |
|
|
|
// ~A & B |
|
if (right != null && |
|
right.Predecessors.Count == 1 && |
|
right.FalseSuccessor == top.TrueSuccessor) { |
|
ShortCircuitBranch scBranch = top.Parent.MergeChilds<ShortCircuitBranch>(top, right); |
|
scBranch.Operator = ShortCircuitOperator.NotLeftAndRight; |
|
return true; |
|
} |
|
|
|
return false; |
|
} |
|
|
|
*/ |
|
|
|
void OrderNodes(ILBlock ast) |
|
{ |
|
// Order movable nodes |
|
var blocks = ast.GetSelfAndChildrenRecursive<ILBlock>().Where(b => !(b is ILMoveableBlock)).ToList(); |
|
ILMoveableBlock first = new ILMoveableBlock() { OriginalOrder = -1 }; |
|
foreach(ILBlock block in blocks) { |
|
block.Body = block.Body.OrderBy(n => (n.GetSelfAndChildrenRecursive<ILMoveableBlock>().FirstOrDefault() ?? first).OriginalOrder).ToList(); |
|
} |
|
} |
|
|
|
/// <summary> |
|
/// Flattens all nested movable blocks, except the the top level 'node' argument |
|
/// </summary> |
|
void FlattenNestedMovableBlocks(ILNode node) |
|
{ |
|
ILBlock block = node as ILBlock; |
|
if (block != null) { |
|
List<ILNode> flatBody = new List<ILNode>(); |
|
if (block.EntryPoint != null) { |
|
flatBody.Add(new ILExpression(OpCodes.Br, block.EntryPoint)); |
|
block.EntryPoint = null; |
|
} |
|
foreach (ILNode child in block.Body) { |
|
FlattenNestedMovableBlocks(child); |
|
if (child is ILMoveableBlock) { |
|
flatBody.AddRange(((ILMoveableBlock)child).Body); |
|
} else { |
|
flatBody.Add(child); |
|
} |
|
} |
|
block.Body = flatBody; |
|
} else if (node is ILExpression) { |
|
// Optimization - no need to check expressions |
|
} else if (node != null) { |
|
// Recursively find all ILBlocks |
|
foreach(ILNode child in node.GetChildren()) { |
|
FlattenNestedMovableBlocks(child); |
|
} |
|
} |
|
} |
|
|
|
void SimpleGotoRemoval(ILBlock ast) |
|
{ |
|
// TODO: Assign IL ranges from br to something else |
|
var blocks = ast.GetSelfAndChildrenRecursive<ILBlock>().ToList(); |
|
foreach(ILBlock block in blocks) { |
|
for (int i = 0; i < block.Body.Count; i++) { |
|
ILExpression expr = block.Body[i] as ILExpression; |
|
// Uncoditional branch |
|
if (expr != null && (expr.OpCode == OpCodes.Br || expr.OpCode == OpCodes.Br_S)) { |
|
// Check that branch is followed by its label (allow multiple labels) |
|
for (int j = i + 1; j < block.Body.Count; j++) { |
|
ILLabel label = block.Body[j] as ILLabel; |
|
if (label == null) |
|
break; // Can not optimize |
|
if (expr.Operand == label) { |
|
block.Body.RemoveAt(i); |
|
break; // Branch removed |
|
} |
|
} |
|
} |
|
} |
|
} |
|
} |
|
|
|
void RemoveDeadLabels(ILBlock ast) |
|
{ |
|
HashSet<ILLabel> liveLabels = new HashSet<ILLabel>(ast.GetSelfAndChildrenRecursive<ILExpression>().SelectMany(e => e.GetBranchTargets())); |
|
var blocks = ast.GetSelfAndChildrenRecursive<ILBlock>().ToList(); |
|
foreach(ILBlock block in blocks) { |
|
for (int i = 0; i < block.Body.Count;) { |
|
ILLabel label = block.Body[i] as ILLabel; |
|
if (label != null && !liveLabels.Contains(label)) { |
|
block.Body.RemoveAt(i); |
|
} else { |
|
i++; |
|
} |
|
} |
|
} |
|
} |
|
} |
|
}
|
|
|