/*
* This file is part of the Jikes RVM project (http://jikesrvm.org).
*
* This file is licensed to You under the Eclipse Public License (EPL);
* You may not use this file except in compliance with the License. You
* may obtain a copy of the License at
*
* http://www.opensource.org/licenses/eclipse-1.0.php
*
* See the COPYRIGHT.txt file distributed with this work for information
* regarding copyright ownership.
*/
package org.jikesrvm.compilers.opt.controlflow;
import static org.jikesrvm.compilers.opt.ir.IRDumpTools.dumpIR;
import static org.jikesrvm.compilers.opt.ir.Operators.ARRAYLENGTH_opcode;
import static org.jikesrvm.compilers.opt.ir.Operators.GOTO;
import static org.jikesrvm.compilers.opt.ir.Operators.GOTO_opcode;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_ADD;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_ADD_opcode;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_AND;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_IFCMP;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_IFCMP_opcode;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_MOVE;
import static org.jikesrvm.compilers.opt.ir.Operators.INT_SUB;
import java.lang.reflect.Constructor;
import java.util.Enumeration;
import java.util.HashMap;
import java.util.Map;
import org.jikesrvm.VM;
import org.jikesrvm.compilers.opt.DefUse;
import org.jikesrvm.compilers.opt.OptOptions;
import org.jikesrvm.compilers.opt.Simple;
import org.jikesrvm.compilers.opt.driver.CompilerPhase;
import org.jikesrvm.compilers.opt.ir.BasicBlock;
import org.jikesrvm.compilers.opt.ir.Binary;
import org.jikesrvm.compilers.opt.ir.ExceptionHandlerBasicBlock;
import org.jikesrvm.compilers.opt.ir.Goto;
import org.jikesrvm.compilers.opt.ir.GuardResultCarrier;
import org.jikesrvm.compilers.opt.ir.GuardedUnary;
import org.jikesrvm.compilers.opt.ir.IR;
import org.jikesrvm.compilers.opt.ir.IfCmp;
import org.jikesrvm.compilers.opt.ir.Instruction;
import org.jikesrvm.compilers.opt.ir.Label;
import org.jikesrvm.compilers.opt.ir.Move;
import org.jikesrvm.compilers.opt.ir.Register;
import org.jikesrvm.compilers.opt.ir.operand.BranchProfileOperand;
import org.jikesrvm.compilers.opt.ir.operand.ConditionOperand;
import org.jikesrvm.compilers.opt.ir.operand.ConstantOperand;
import org.jikesrvm.compilers.opt.ir.operand.IntConstantOperand;
import org.jikesrvm.compilers.opt.ir.operand.Operand;
import org.jikesrvm.compilers.opt.ir.operand.RegisterOperand;
import org.jikesrvm.compilers.opt.util.GraphNode;
import org.jikesrvm.util.BitVector;
public class LoopUnrolling extends CompilerPhase {
static final boolean DEBUG = false;
static final int MAX_BLOCKS_FOR_NAIVE_UNROLLING = 20;
private final Map<BasicBlock, BasicBlock> copiedBlocks;
private int theVisit = 1;
private Map<Instruction, Integer> visitInts;
public LoopUnrolling() {
copiedBlocks = new HashMap<BasicBlock, BasicBlock>();
}
/**
* Returns the name of the phase.
*/
@Override
public String getName() {
return "Loop Unrolling";
}
/**
* Constructor for this compiler phase
*/
private static final Constructor<CompilerPhase> constructor =
getCompilerPhaseConstructor(LoopUnrolling.class);
/**
* Get a constructor object for this compiler phase
* @return compiler phase constructor
*/
@Override
public Constructor<CompilerPhase> getClassConstructor() {
return constructor;
}
/**
* This phase is disabled by default.
* <p>
* It will run only on O3 but O2 is the default maximum optimization level.
*/
@Override
public boolean shouldPerform(OptOptions options) {
return ((options.getOptLevel() >= 3) && (options.CONTROL_UNROLL_LOG >= 1) && (!options.SSA_LOOP_VERSIONING));
}
@Override
public void perform(IR ir) {
unrollFactor = (1 << ir.options.CONTROL_UNROLL_LOG);
if (ir.hasReachableExceptionHandlers()) return;
DefUse.computeDU(ir);
new Simple(1, true, true, true, false).perform(ir);
new BranchOptimizations(-1, true, true).perform(ir, true);
//new CFGTransformations().perform(ir);
// Note: the following unfactors the CFG
new DominatorsPhase(true).perform(ir);
DefUse.computeDU(ir);
visitInts = new HashMap<Instruction, Integer>();
Enumeration<Instruction> instEnum = ir.forwardInstrEnumerator();
while (instEnum.hasMoreElements()) {
Instruction inst = instEnum.nextElement();
visitInts.put(inst, Integer.valueOf(0));
}
unrollLoops(ir);
CFGTransformations.splitCriticalEdges(ir);
ir.cfg.compactNodeNumbering();
}
void unrollLoops(IR ir) {
LSTGraph lstg = ir.HIRInfo.loopStructureTree;
for (int i = 1; lstg != null && i <= 1; ++i) {
unrollLoopTree((LSTNode) lstg.firstNode(), ir, i);
(new BuildLST()).perform(ir);
}
}
int unrollLoopTree(LSTNode t, IR ir, int target) {
int height = 1;
Enumeration<GraphNode> e = t.outNodes();
if (!e.hasMoreElements()) {
if (t.loop != null) {
report("Leaf loop in " + ir.method + ": " + t.loop);
// check infrequency
if (t.header.getInfrequent()) {
report("no unrolling of infrequent loop");
} else {
boolean doNaiveUnrolling = height == target && unrollLeaf(t, ir);
if (doNaiveUnrolling) naiveUnroller(t, ir);
}
}
} else {
while (e.hasMoreElements()) {
LSTNode n = (LSTNode) e.nextElement();
int heightOfTree = unrollLoopTree(n, ir, target);
height = Math.max(height, heightOfTree) + 1;
}
}
return height;
}
static final int MaxInstructions = 100;
private int unrollFactor = 1;
boolean unrollLeaf(LSTNode t, IR ir) {
int instructionsInLoop = 0;
BasicBlock exitBlock = null, backEdgeBlock = null, succBlock = null, predBlock = null;
BitVector nloop = t.loop;
BasicBlock header = t.header;
Instruction tmp;
if (ir.hasReachableExceptionHandlers()) {
report("0 IR may have exception handlers");
return false;
}
// determine loop structure by looking at its blocks
Enumeration<BasicBlock> loopBlocks = ir.getBasicBlocks(nloop);
int blocks = 0;
while (loopBlocks.hasMoreElements()) {
BasicBlock b = loopBlocks.nextElement();
blocks++;
// check for size
instructionsInLoop += b.getNumberOfRealInstructions();
if (instructionsInLoop > MaxInstructions) {
report("1 is too big");
return false;
}
// look at the in edges. We want the header to be the only
// block with out of loop incoming edges.
Enumeration<BasicBlock> e = b.getIn();
if (b != header) {
while (e.hasMoreElements()) {
BasicBlock o = e.nextElement();
if (!CFGTransformations.inLoop(o, nloop)) {
report("2 interior pointers.");
return true;
}
}
} else {
// check the headers predecessors: there should be
// one out of loop input and one backedge.
// We can extend this for loops with several backedges,
// if they all have the same conditions.
int inEdges = 0;
while (e.hasMoreElements()) {
inEdges++;
BasicBlock o = e.nextElement();
if (!CFGTransformations.inLoop(o, nloop)) {
if (predBlock == null) {
predBlock = o;
} else {
report("3 multi entry header.");
return true;
}
} else {
if (backEdgeBlock == null) {
backEdgeBlock = o;
} else {
report("4 multiple back edges.");
return true;
}
}
}
}
// look at the out edges to find loop exits
e = b.getOut();
while (e.hasMoreElements()) {
BasicBlock out = e.nextElement();
if (!CFGTransformations.inLoop(out, nloop)) {
if (exitBlock == null) {
exitBlock = b;
} else {
report("5 multiple exit blocks.");
return true;
}
}
}
}
// exitBlock must equal backEdgeBlock
if (exitBlock == null) {
report("6 no exit block found...infinite loop?");
return true;
}
if (exitBlock != backEdgeBlock) {
report("7 exit block is not immediate predecessor of loop head");
return true;
}
// exitBlock must exit (skip over pads in critical edges)
while (exitBlock.getNumberOfOut() == 1 && exitBlock.getNumberOfIn() == 1) {
exitBlock = exitBlock.getIn().nextElement();
}
if (exitBlock == header && blocks > 1) {
report("6 while loop? (" + blocks + ")");
return true;
}
// So far, so good. Examine the exit test.
Instruction origBranch = exitBlock.firstBranchInstruction();
if (origBranch != exitBlock.lastRealInstruction()) {
Instruction aGoto = origBranch.nextInstructionInCodeOrder();
if (aGoto.getOpcode() != GOTO_opcode) {
report("7 too complex exit");
return true;
}
succBlock = Label.getBlock(Goto.getTarget(aGoto).target).block;
if (VM.VerifyAssertions) {
VM._assert(aGoto == exitBlock.lastRealInstruction());
}
} else {
succBlock = exitBlock.getFallThroughBlock();
}
if (origBranch.getOpcode() != INT_IFCMP_opcode) {
report("8 branch isn't int_ifcmp: " + origBranch.operator() + ".");
return true;
}
// examine operands:
Operand op1 = follow(IfCmp.getVal1(origBranch));
Operand op2 = follow(IfCmp.getVal2(origBranch));
ConditionOperand cond = (ConditionOperand) IfCmp.getCond(origBranch).copy();
RegisterOperand ifcmpGuard = IfCmp.getGuardResult(origBranch);
float backBranchProbability = IfCmp.getBranchProfile(origBranch).takenProbability;
if (!loopInvariant(op2, nloop, 4)) {
if (loopInvariant(op1, nloop, 4)) {
Operand op = op1;
op1 = op2;
op2 = op;
cond.flipOperands();
} else {
if (DEBUG) {
printDefs(op1, nloop, 4);
printDefs(op2, nloop, 4);
VM.sysWriteln(origBranch.toString());
}
report("8a op1 and op2 may not be loop invariant");
return true;
}
}
BasicBlock target = Label.getBlock(IfCmp.getTarget(origBranch).target).block;
if (!(op1 instanceof RegisterOperand)) {
report("9 op1 of ifcmp isn't a register");
return true;
}
RegisterOperand rop1 = (RegisterOperand) op1;
Register reg = rop1.getRegister();
if (reg.isPhysical()) {
report("10 loops over physical register");
return false;
}
if (succBlock == header && !CFGTransformations.inLoop(target, nloop)) {
succBlock = target;
target = header;
cond.flipCode();
}
if (target != header) {
report("11 ifcmp doesn't jump to header");
return true;
}
Instruction iterator = null;
Enumeration<Operand> defs = new RealDefs(rop1);
while (defs.hasMoreElements()) {
Operand def = defs.nextElement();
Instruction inst = def.instruction;
BasicBlock block = inst.getBasicBlock();
//VM.sysWriteln(block + ": " + inst);
if (CFGTransformations.inLoop(block, nloop)) {
if (iterator == null) {
iterator = inst;
} else {
report("12 iterator not unique.");
return true;
}
}
}
if (iterator == null) {
report("15 iterator not found.");
return true;
}
if (iterator.getOpcode() != INT_ADD_opcode) {
//dumpIR (ir, "malformed");
report("16 iterator is no addition: " + iterator.operator());
return true;
}
if (!rop1.similar(follow(Binary.getVal1(iterator)))) {
//dumpIR (ir, "malformed");
report("17 malformed iterator.\n" + iterator);
return true;
}
Operand strideOp = follow(Binary.getVal2(iterator));
if (!(strideOp instanceof IntConstantOperand)) {
report("18 stride not constant");
return true;
}
int stride = ((IntConstantOperand) strideOp).value;
if (stride != 1 && stride != -1) {
report("18b stride != +/-1 (" + stride + ")");
return true;
}
if ((stride == 1 &&
((cond.value != ConditionOperand.LESS) &&
cond.value != ConditionOperand.LESS_EQUAL &&
cond.value != ConditionOperand.NOT_EQUAL)) ||
(stride == -1 &&
((cond.value != ConditionOperand.GREATER) &&
cond.value != ConditionOperand.GREATER_EQUAL &&
cond.value != ConditionOperand.NOT_EQUAL))) {
report("19 unexpected condition: " + cond + "\n" + iterator + "\n" + origBranch);
return true;
}
RegisterOperand outerGuard;
BasicBlock outer = predBlock;
while (outer.getNumberOfOut() == 1 && outer.getNumberOfIn() == 1) {
outer = outer.getIn().nextElement();
}
if (outer.getNumberOfIn() > 0 && outer.getNumberOfOut() < 2) {
report("23 no suitable outer guard found.");
return true;
}
tmp = outer.firstBranchInstruction();
if (tmp != null && GuardResultCarrier.conforms(tmp)) {
outerGuard = GuardResultCarrier.getGuardResult(tmp);
} else {
outerGuard = ir.regpool.makeTempValidation();
}
////////////
// transfom
// transform this:
//
// Orig:
// B
// if i CC b goto Orig
// else goto exit
//
// exit:
//
// into this:
//
//
// stride == 1: common: stride == -1:
//--------------------------------------------------------------------------
// guard0:
// limit = b;
// if a > b goto Orig if b > a goto Orig
// else guard1
//
//
// guard 1:
// remainder = b - a; remainder = a - b;
// if cond == '<=' if cond == '>='
// remainder++; remainder++;
// remainder = remainder & 3
// limit = a + remainder limit = a - remainder
// if cond == '<=' if cond == '>='
// limit--; limit++;
// if remainder == 0 goto mllp
// goto Orig
//
// Orig:
// LOOP;
// if i CC limit goto Orig
// else guard2
//
// guard2: if i CC b goto mllp
// else exit
//
// mllp: // landing pad
// goto ml
//
// ml:
// LOOP;LOOP;LOOP;LOOP;
// if i CC b goto ml
// else exit
//
// exit:
//--------------------------------------------------------------------------
report("...transforming.");
if (DEBUG && ir.options.hasMETHOD_TO_PRINT() && ir.options.fuzzyMatchMETHOD_TO_PRINT(ir.method.toString())) {
dumpIR(ir, "before unroll");
}
CFGTransformations.killFallThroughs(ir, nloop);
BasicBlock[] handles = makeSomeCopies(unrollFactor, ir, nloop, blocks, header, exitBlock, exitBlock);
BasicBlock mainHeader = handles[0];
BasicBlock mainExit = handles[1];
// test block for well formed bounds
BasicBlock guardBlock0 = header.createSubBlock(header.firstInstruction().getBytecodeIndex(), ir);
predBlock.redirectOuts(header, guardBlock0, ir);
// test block for iteration alignemnt
BasicBlock guardBlock1 = header.createSubBlock(header.firstInstruction().getBytecodeIndex(), ir);
// landing pad for orig loop
BasicBlock olp = header.createSubBlock(header.firstInstruction().getBytecodeIndex(), ir);
olp.setLandingPad();
BasicBlock predSucc = predBlock.nextBasicBlockInCodeOrder();
if (predSucc != null) {
ir.cfg.breakCodeOrder(predBlock, predSucc);
ir.cfg.linkInCodeOrder(olp, predSucc);
}
ir.cfg.linkInCodeOrder(predBlock, guardBlock0);
ir.cfg.linkInCodeOrder(guardBlock0, guardBlock1);
ir.cfg.linkInCodeOrder(guardBlock1, olp);
// guard block for main loop
BasicBlock guardBlock2 = header.createSubBlock(header.firstInstruction().getBytecodeIndex(), ir);
// landing pad for main loop
BasicBlock landingPad = header.createSubBlock(header.firstInstruction().getBytecodeIndex(), ir);
landingPad.setLandingPad();
BasicBlock mainLoop = exitBlock.nextBasicBlockInCodeOrder();
ir.cfg.breakCodeOrder(exitBlock, mainLoop);
ir.cfg.linkInCodeOrder(exitBlock, guardBlock2);
ir.cfg.linkInCodeOrder(guardBlock2, landingPad);
ir.cfg.linkInCodeOrder(landingPad, mainLoop);
RegisterOperand remainder = ir.regpool.makeTemp(rop1.getType());
RegisterOperand limit = ir.regpool.makeTemp(rop1.getType());
// test whether a <= b for stride == 1 and a >= b for stride == -1
tmp = guardBlock0.lastInstruction();
tmp.insertBefore(Move.create(INT_MOVE, limit, op2.copy()));
ConditionOperand g0cond = ConditionOperand.GREATER_EQUAL();
if (stride == -1) g0cond = ConditionOperand.LESS_EQUAL();
tmp.insertBefore(IfCmp.create(INT_IFCMP,
outerGuard.copyD2D(),
rop1.copyD2U(),
op2.copy(),
g0cond,
olp.makeJumpTarget(),
BranchProfileOperand.unlikely()));
tmp.insertBefore(Goto.create(GOTO, guardBlock1.makeJumpTarget()));
// align the loop iterations
tmp = guardBlock1.lastInstruction();
if (stride == 1) {
tmp.insertBefore(Binary.create(INT_SUB, remainder, op2.copy(), rop1.copyD2U()));
} else {
tmp.insertBefore(Binary.create(INT_SUB, remainder, rop1.copyD2U(), op2.copy()));
}
if (cond.isGREATER_EQUAL() || cond.isLESS_EQUAL()) {
tmp.insertBefore(Binary.create(INT_ADD, remainder.copyD2D(), remainder.copyD2U(), new IntConstantOperand(1)));
}
tmp.insertBefore(Binary.create(INT_ADD, remainder.copyD2D(), remainder.copyD2U(), new IntConstantOperand(-1)));
tmp.insertBefore(Binary.create(INT_AND,
remainder.copyD2D(),
remainder.copyD2U(),
new IntConstantOperand(unrollFactor - 1)));
tmp.insertBefore(Binary.create(INT_ADD, remainder.copyD2D(), remainder.copyD2U(), new IntConstantOperand(1)));
if (stride == 1) {
tmp.insertBefore(Binary.create(INT_ADD, limit.copyD2U(), op1.copy(), remainder.copyD2U()));
} else {
tmp.insertBefore(Binary.create(INT_SUB, limit.copyD2U(), op1.copy(), remainder.copyD2U()));
}
if (cond.isLESS_EQUAL()) {
tmp.insertBefore(Binary.create(INT_ADD, limit.copyD2D(), limit.copyD2U(), new IntConstantOperand(-1)));
}
if (cond.isGREATER_EQUAL()) {
tmp.insertBefore(Binary.create(INT_ADD, limit.copyD2D(), limit.copyD2U(), new IntConstantOperand(1)));
}
tmp.insertBefore(Goto.create(GOTO, olp.makeJumpTarget()));
// build landing pad for original loop
tmp = olp.lastInstruction();
tmp.insertBefore(Goto.create(GOTO, header.makeJumpTarget()));
// change the back branch in the original loop
deleteBranches(exitBlock);
tmp = exitBlock.lastInstruction();
tmp.insertBefore(IfCmp.create(INT_IFCMP,
outerGuard.copyD2D(),
rop1.copyU2U(),
limit.copyD2U(),
(ConditionOperand) cond.copy(),
header.makeJumpTarget(),
new BranchProfileOperand(1.0f - 1.0f / (unrollFactor / 2))));
tmp.insertBefore(Goto.create(GOTO, guardBlock2.makeJumpTarget()));
// only enter main loop if iterations left
tmp = guardBlock2.lastInstruction();
tmp.insertBefore(IfCmp.create(INT_IFCMP,
outerGuard.copyD2D(),
rop1.copyU2U(),
op2.copy(),
(ConditionOperand) cond.copy(),
landingPad.makeJumpTarget(),
new BranchProfileOperand(backBranchProbability)));
tmp.insertBefore(Goto.create(GOTO, succBlock.makeJumpTarget()));
// landing pad jumps to mainHeader
tmp = landingPad.lastInstruction();
tmp.insertBefore(Goto.create(GOTO, mainHeader.makeJumpTarget()));
// repair back edge in mainExit
if (VM.VerifyAssertions) VM._assert(mainExit != null);
tmp = mainExit.lastInstruction();
if (VM.VerifyAssertions) {
VM._assert((mainExit.lastRealInstruction() == null) || !mainExit.lastRealInstruction().isBranch());
}
tmp.insertBefore(IfCmp.create(INT_IFCMP,
ifcmpGuard.copyU2U(),
rop1.copyU2U(),
op2.copy(),
(ConditionOperand) cond.copy(),
mainHeader.makeJumpTarget(),
new BranchProfileOperand(1.0f - (1.0f - backBranchProbability) * unrollFactor)));
tmp.insertBefore(Goto.create(GOTO, succBlock.makeJumpTarget()));
// recompute normal outs
guardBlock0.recomputeNormalOut(ir);
guardBlock1.recomputeNormalOut(ir);
olp.recomputeNormalOut(ir);
guardBlock2.recomputeNormalOut(ir);
exitBlock.recomputeNormalOut(ir);
landingPad.recomputeNormalOut(ir);
mainExit.recomputeNormalOut(ir);
if (DEBUG && ir.options.hasMETHOD_TO_PRINT() && ir.options.fuzzyMatchMETHOD_TO_PRINT(ir.method.toString())) {
dumpIR(ir, "after unroll");
}
return false;
}
private void naiveUnroller(LSTNode t, IR ir) {
BitVector nloop = t.loop;
BasicBlock seqStart = null;
Enumeration<BasicBlock> bs;
if (t.loop.populationCount() > MAX_BLOCKS_FOR_NAIVE_UNROLLING) {
report("1 is too big");
return;
}
report("Naively unrolling");
CFGTransformations.killFallThroughs(ir, nloop);
// first, capture the blocks in the loop body.
int bodyBlocks = nloop.populationCount();
BasicBlock[] body = new BasicBlock[bodyBlocks];
{
int i = 0;
bs = ir.getBasicBlocks(nloop);
while (bs.hasMoreElements()) {
BasicBlock b = bs.nextElement();
if (VM.VerifyAssertions) {
VM._assert(!(b instanceof ExceptionHandlerBasicBlock));
}
body[i++] = b;
BasicBlock next = b.nextBasicBlockInCodeOrder();
if (next == null || !CFGTransformations.inLoop(next, nloop)) {
seqStart = b; // end of loop in code order
}
}
}
BasicBlock seqEnd = seqStart.nextBasicBlockInCodeOrder();
if (seqEnd != null) ir.cfg.breakCodeOrder(seqStart, seqEnd);
BasicBlock seqLast = seqStart;
BasicBlock firstHeaderCopy = null;
BasicBlock currentBlock = seqLast;
for (int i = 1; i <= unrollFactor; ++i) {
// copy body
for (BasicBlock bb : body) {
seqLast = copyAndLinkBlock(ir, seqLast, bb);
if (bb == t.header) {
if (firstHeaderCopy == null) {
firstHeaderCopy = seqLast;
}
}
}
// redirect internal branches
currentBlock = seqLast;
for (int j = 0; j < bodyBlocks; ++j) {
currentBlock.recomputeNormalOut(ir);
Enumeration<BasicBlock> be = currentBlock.getOut();
while (be.hasMoreElements()) {
BasicBlock out = be.nextElement();
if (out != t.header && CFGTransformations.inLoop(out, nloop)) {
BasicBlock outCopy = copiedBlocks.get(out);
currentBlock.redirectOuts(out, outCopy, ir);
}
}
currentBlock.recomputeNormalOut(ir);
currentBlock = currentBlock.prevBasicBlockInCodeOrder();
}
if (i != 1) {
// redirect the branches to the header in the (i-1)th copy
for (int j = 0; j < bodyBlocks; ++j) {
Enumeration<BasicBlock> be = currentBlock.getOut();
while (be.hasMoreElements()) {
BasicBlock out = be.nextElement();
if (out == t.header) {
BasicBlock headerCopy;
headerCopy = copiedBlocks.get(t.header);
currentBlock.redirectOuts(t.header, headerCopy, ir);
}
}
currentBlock.recomputeNormalOut(ir);
currentBlock = currentBlock.prevBasicBlockInCodeOrder();
}
}
}
if (seqEnd != null) ir.cfg.linkInCodeOrder(seqLast, seqEnd);
// in the original loop, redirect branches that go to the header
// and make them point to the first header copy
for (int j = 0; j < bodyBlocks; ++j) {
Enumeration<BasicBlock> be = body[j].getOut();
while (be.hasMoreElements()) {
BasicBlock out = be.nextElement();
if (out == t.header) {
body[j].redirectOuts(t.header, firstHeaderCopy, ir);
}
}
body[j].recomputeNormalOut(ir);
}
// the following loop redirects backedges that start in the last
// copy to point to the first copy instead and not to the original
// header.
// | |
// Thus we get [ ] instead of [ ]<-.
// | | |
// [ ]<-. [ ] |
// | | | |
// [ ] | [ ] |
// | | | |
// [ ] | [ ] |
// |\_/ |\_/
//
// Instead of 2^(unroll_log) we only have 2^(unroll_log-1) bodies
// in the unrolled loop, but there is one copy of the loop's body
// that dominates the unrolled version. Peeling of this first
// version should have benefits for global code placement.
currentBlock = seqLast;
for (int j = 0; j < bodyBlocks; ++j) {
Enumeration<BasicBlock> be = currentBlock.getOut();
while (be.hasMoreElements()) {
BasicBlock out = be.nextElement();
if (out == t.header) {
currentBlock.redirectOuts(t.header, firstHeaderCopy, ir);
}
}
currentBlock.recomputeNormalOut(ir);
currentBlock = currentBlock.prevBasicBlockInCodeOrder();
}
}
static void report(String s) {
if (DEBUG) VM.sysWriteln("] " + s);
}
private Operand follow(Operand use) {
theVisit++;
return _follow(use);
}
private Operand _follow(Operand use) {
while (true) {
if (!(use instanceof RegisterOperand)) return use;
RegisterOperand rop = (RegisterOperand) use;
Enumeration<RegisterOperand> defs = DefUse.defs(rop.getRegister());
if (!defs.hasMoreElements()) {
return use;
}
Instruction def = defs.nextElement().instruction;
if (!Move.conforms(def)) return use;
if (defs.hasMoreElements()) {
return use;
}
Integer defInt = visitInts.get(def);
if (defInt.intValue() == theVisit) {
return use;
}
visitInts.put(def, Integer.valueOf(theVisit));
use = Move.getVal(def);
}
}
private static Instruction definingInstruction(Operand op) {
if (!(op instanceof RegisterOperand)) return op.instruction;
Enumeration<RegisterOperand> defs = DefUse.defs(((RegisterOperand) op).getRegister());
if (!defs.hasMoreElements()) {
return op.instruction;
}
Instruction def = defs.nextElement().instruction;
if (defs.hasMoreElements()) {
return op.instruction;
}
return def;
}
private static boolean loopInvariant(Operand op, BitVector nloop, int depth) {
if (depth <= 0) {
return false;
} else if (op instanceof ConstantOperand) {
return true;
} else if (op instanceof RegisterOperand) {
Register reg = ((RegisterOperand) op).getRegister();
Enumeration<RegisterOperand> defs = DefUse.defs(reg);
// if no definitions of this register (very strange) give up
if (!defs.hasMoreElements()) return false;
Instruction inst = defs.nextElement().instruction;
// if multiple definitions of a register give up as follow may
// fail to give the correct invariant
return !defs.hasMoreElements() && !CFGTransformations.inLoop(inst.getBasicBlock(), nloop);
} else {
return false;
}
}
private static boolean printDefs(Operand op, BitVector nloop, int depth) {
if (depth <= 0) return false;
if (op instanceof ConstantOperand) {
VM.sysWriteln(">> " + op);
return true;
}
if (op instanceof RegisterOperand) {
boolean invariant = true;
Register reg = ((RegisterOperand) op).getRegister();
Enumeration<RegisterOperand> defs = DefUse.defs(reg);
while (defs.hasMoreElements()) {
Instruction inst = defs.nextElement().instruction;
VM.sysWriteln(">> " + inst.getBasicBlock() + ": " + inst);
if (CFGTransformations.inLoop(inst.getBasicBlock(), nloop)) {
if (Move.conforms(inst)) {
invariant &= printDefs(Move.getVal(inst), nloop, depth - 1);
} else if (inst.getOpcode() == ARRAYLENGTH_opcode) {
invariant &= printDefs(GuardedUnary.getVal(inst), nloop, depth);
} else {
invariant = false;
}
}
if (!invariant) break;
}
return invariant;
}
return false;
}
@SuppressWarnings("unused")
// For debugging
private void _printDefs(Operand op) {
if (op instanceof RegisterOperand) {
Register reg = ((RegisterOperand) op).getRegister();
Enumeration<RegisterOperand> defs = DefUse.defs(reg);
defs = DefUse.defs(reg);
while (defs.hasMoreElements()) {
Instruction inst = defs.nextElement().instruction;
if (Move.conforms(inst)) {
inst = definingInstruction(follow(Move.getVal(inst)));
}
VM.sysWriteln(">> " + inst.getBasicBlock() + ": " + inst);
}
} else {
VM.sysWriteln(">> " + op);
}
}
// inserts unrollFactor copies of the loop after seqStart
BasicBlock[] makeSomeCopies(int unrollFactor, IR ir, BitVector nloop, int blocks,
BasicBlock header, BasicBlock exitBlock, BasicBlock seqStart) {
// make some copies of the original loop
// first, capture the blocks in the loop body.
BitVector loop = new BitVector(nloop);
loop.clear(header.getNumber());
loop.clear(exitBlock.getNumber());
int bodyBlocks = 0;
Enumeration<BasicBlock> bs = ir.getBasicBlocks(loop);
while (bs.hasMoreElements()) {
bodyBlocks++;
bs.nextElement();
}
BasicBlock[] body = new BasicBlock[bodyBlocks];
{
int i = 0;
bs = ir.getBasicBlocks(loop);
while (bs.hasMoreElements()) {
body[i++] = bs.nextElement();
}
}
BasicBlock seqEnd = seqStart.nextBasicBlockInCodeOrder();
if (seqEnd != null) ir.cfg.breakCodeOrder(seqStart, seqEnd);
BasicBlock seqLast = seqStart;
BasicBlock firstHeader = null;
BasicBlock lastHeader = null;
BasicBlock lastExit = null;
BasicBlock[] handles = new BasicBlock[2];
for (int i = 0; i < unrollFactor; ++i) {
// copy header
seqLast = copyAndLinkBlock(ir, seqLast, header);
lastHeader = seqLast;
if (i == 0) {
firstHeader = seqLast;
} else {
// link copies by jumps
lastExit.appendInstruction(Goto.create(GOTO, seqLast.makeJumpTarget()));
lastExit.recomputeNormalOut(ir);
}
// copy body
for (BasicBlock bb : body) {
seqLast = copyAndLinkBlock(ir, seqLast, bb);
}
// copy exit block
if (exitBlock != header) {
seqLast = copyAndLinkBlock(ir, seqLast, exitBlock);
lastExit = seqLast;
} else {
lastExit = lastHeader;
}
// delete all branches in the copies of the exit block
deleteBranches(lastExit);
// redirect internal branches
BasicBlock cb = seqLast;
for (int j = 0; j < blocks; ++j) {
cb.recomputeNormalOut(ir);
Enumeration<BasicBlock> be = cb.getOut();
while (be.hasMoreElements()) {
BasicBlock out = be.nextElement();
if (CFGTransformations.inLoop(out, nloop)) {
cb.redirectOuts(out, copiedBlocks.get(out), ir);
}
}
cb.recomputeNormalOut(ir);
cb = cb.prevBasicBlockInCodeOrder();
}
}
if (seqEnd != null) ir.cfg.linkInCodeOrder(seqLast, seqEnd);
handles[0] = firstHeader;
handles[1] = lastExit;
return handles;
}
BasicBlock copyAndLinkBlock(IR ir, BasicBlock seqLast, BasicBlock block) {
BasicBlock copy = block.copyWithoutLinks(ir);
ir.cfg.linkInCodeOrder(seqLast, copy);
copiedBlocks.put(block, copy);
return copy;
}
static void deleteBranches(BasicBlock b) {
Instruction branch = b.lastRealInstruction();
while (branch.isBranch()) {
Instruction nextBranch = branch.prevInstructionInCodeOrder();
branch.remove();
branch = nextBranch;
}
}
final class RealDefs implements Enumeration<Operand> {
private Enumeration<RegisterOperand> defs = null;
private Operand use;
private RealDefs others = null;
private void init(Operand use) {
this.use = use;
if (use instanceof RegisterOperand) {
RegisterOperand rop = (RegisterOperand) use;
defs = DefUse.defs(rop.getRegister());
this.use = null;
if (!defs.hasMoreElements()) defs = null;
}
}
RealDefs(Operand use) {
this.init(use);
theVisit++;
}
RealDefs(Operand use, int visit) {
this.init(use);
theVisit = visit;
}
@Override
public boolean hasMoreElements() {
return use != null || (others != null && others.hasMoreElements()) || (defs != null && defs.hasMoreElements());
}
@Override
public Operand nextElement() {
Operand res = use;
if (res != null) {
use = null;
return res;
}
if (others != null && others.hasMoreElements()) {
return others.nextElement();
}
res = defs.nextElement();
Instruction inst = res.instruction;
if (!(Move.conforms(inst)) || visitInts.get(inst).intValue() == theVisit) {
return res;
}
visitInts.put(inst, Integer.valueOf(theVisit));
others = new RealDefs(Move.getVal(inst), theVisit);
if (!(others.hasMoreElements())) return res;
return others.nextElement();
}
public Operand nextClear() {
Operand res = nextElement();
res.instruction = null;
return res;
}
}
}