mirror of
https://gitlab.com/freepascal.org/fpc/source.git
synced 2025-05-05 11:52:33 +02:00

* changed command line option meanings for the optimizer: O2 now means peephole opts, CSE and register renaming in 1 pass; O3 is the same, but repeated until no further optimizations are possible or until 5 passes have been done (to avoid endless loops) * changed aopt386 so it does this looping * added some procedures from csopt386 to the interface because they're used by rropt386 as well * some changes to csopt386 and daopt386 so that instructions newly added by the CSE get optimizer info (they were simply skipped previously); this fixes some bugs
1754 lines
71 KiB
ObjectPascal
1754 lines
71 KiB
ObjectPascal
{
|
|
$Id$
|
|
Copyright (c) 1998-2000 by Jonas Maebe, member of the Free Pascal
|
|
development team
|
|
|
|
This unit contains the common subexpression elimination procedure.
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
****************************************************************************
|
|
}
|
|
Unit CSOpt386;
|
|
|
|
{$i defines.inc}
|
|
|
|
Interface
|
|
|
|
Uses aasm, cpubase, cpuasm;
|
|
|
|
function CSE(asmL: paasmoutput; first, last: pai; pass: longint): boolean;
|
|
|
|
function doReplaceReg(hp: paicpu; newReg, orgReg: tregister): boolean;
|
|
function changeOp(var o: toper; newReg, orgReg: tregister): boolean;
|
|
function storeBack(p1: pai; orgReg, newReg: tregister): boolean;
|
|
function NoHardCodedRegs(p: paicpu; orgReg, newReg: TRegister): boolean;
|
|
function RegSizesOK(oldReg,newReg: TRegister; p: paicpu): boolean;
|
|
|
|
Implementation
|
|
|
|
Uses
|
|
{$ifdef replaceregdebug}cutils,{$endif}
|
|
globtype, verbose, hcodegen, globals, daopt386, tgeni386, rropt386;
|
|
|
|
{
|
|
Function PaiInSequence(P: Pai; Const Seq: TContent): Boolean;
|
|
Var P1: Pai;
|
|
Counter: Byte;
|
|
TmpResult: Boolean;
|
|
Begin
|
|
TmpResult := False;
|
|
P1 := Seq.StartMod;
|
|
Counter := 1;
|
|
While Not(TmpResult) And
|
|
(Counter <= Seq.NrOfMods) Do
|
|
Begin
|
|
If (P = P1) Then TmpResult := True;
|
|
Inc(Counter);
|
|
p1 := Pai(p1^.Next);
|
|
End;
|
|
PaiInSequence := TmpResult;
|
|
End;
|
|
}
|
|
|
|
function modifiesConflictingMemLocation(p1: pai; reg: tregister; c: tregContent;
   var regsStillValid: tregset): boolean;
{ Checks which of the register contents in c (indexed R_EAX..R_EDI) are      }
{ reported as destroyed by the write(s) performed by instruction p1.         }
{                                                                            }
{   p1             - the list entry to examine; anything that is not an      }
{                    ait_instruction leaves everything untouched             }
{   reg            - the register the caller is interested in                }
{   c              - the register contents to test against                   }
{   regsStillValid - every register whose contents are reported destroyed is }
{                    removed from this set                                   }
{                                                                            }
{ Returns true if at least one register was invalidated and reg is not (or   }
{ no longer) a member of regsStillValid; false otherwise.                    }
var
  p, hp: paicpu;
  tmpRef: treference;
  regCounter: tregister;
  opCount: byte;
begin
  modifiesConflictingMemLocation := false;
  if p1^.typ <> ait_instruction then
    exit;
  p := paicpu(p1);
  case p^.opcode of
    A_MOV,A_MOVSX,A_MOVZX:
      if p^.oper[1].typ = top_ref then
        { store to memory }
        for regCounter := R_EAX to R_EDI do
          begin
            if writeToMemDestroysContents(reg32(p^.oper[0].reg),p^.oper[1].ref^,
                 regCounter,c[regCounter]) then
              begin
                exclude(regsStillValid,regCounter);
                modifiesConflictingMemLocation := not(reg in regsStillValid);
              end;
          end
      else
        { destination is not a memory reference }
        for regCounter := R_EAX to R_EDI do
          begin
            if writeDestroysContents(p^.oper[1],regCounter,c[regCounter]) then
              begin
                exclude(regsStillValid,regCounter);
                modifiesConflictingMemLocation := not(reg in regsStillValid);
              end
          end;
    A_DIV, A_IDIV, A_MUL, A_IMUL:
      begin
        if (p^.ops = 1) then
          begin
            { one-operand form: only handled when edx is a regvar and the  }
            { instruction is NOT followed by "mov %edx,<x>; pop %edx"      }
            if is_reg_var[R_EDX] and
               (not getNextInstruction(p,hp) or
                not((hp^.typ = ait_instruction) and
                    (hp^.opcode = A_MOV) and
                    (hp^.oper[0].typ = top_reg) and
                    (reg32(hp^.oper[0].reg) = R_EDX) and
                    getNextInstruction(hp,hp) and
                    (hp^.typ = ait_instruction) and
                    (hp^.opcode = A_POP) and
                    (hp^.oper[0].reg = R_EDX))) then
              for regCounter := R_EAX to R_EDI do
                if writeToRegDestroysContents(R_EDX,regCounter,c[regCounter]) then
                  begin
                    { The contents of regCounter depend on edx, so          }
                    { regCounter itself has to be invalidated. The previous }
                    { code only ever excluded R_EDX here and ignored the    }
                    { loop variable; R_EDX is still excluded as well so the }
                    { result is never less conservative than before.        }
                    exclude(regsStillValid,regCounter);
                    exclude(regsStillValid,R_EDX);
                    modifiesConflictingMemLocation := not(reg in regsStillValid);
                  end
          end
        else
          { only possible for imul }
          { last operand is always destination }
          if is_reg_var[reg32(p^.oper[p^.ops-1].reg)] then
            for regCounter := R_EAX to R_EDI do
              begin
                if writeDestroysContents(p^.oper[p^.ops-1],regCounter,c[regCounter]) then
                  begin
                    exclude(regsStillValid,regCounter);
                    modifiesConflictingMemLocation := not(reg in regsStillValid);
                  end
              end
      end;
    else
      { generic case: use the instruction property table to find out which }
      { operands (or the memory at edi) get written                        }
      for opCount := 1 to MaxCh do
        case InsProp[p^.opcode].Ch[opCount] of
          Ch_MOp1,CH_WOp1,CH_RWOp1:
            for regCounter := R_EAX to R_EDI do
              if writeDestroysContents(p^.oper[0],regCounter,c[regCounter]) then
                begin
                  exclude(regsStillValid,regCounter);
                  modifiesConflictingMemLocation := not(reg in regsStillValid);
                end;
          Ch_MOp2,CH_WOp2,CH_RWOp2:
            for regCounter := R_EAX to R_EDI do
              if writeDestroysContents(p^.oper[1],regCounter,c[regCounter]) then
                begin
                  exclude(regsStillValid,regCounter);
                  modifiesConflictingMemLocation := not(reg in regsStillValid);
                end;
          Ch_MOp3,CH_WOp3,CH_RWOp3:
            for regCounter := R_EAX to R_EDI do
              if writeDestroysContents(p^.oper[2],regCounter,c[regCounter]) then
                begin
                  exclude(regsStillValid,regCounter);
                  modifiesConflictingMemLocation := not(reg in regsStillValid);
                end;
          Ch_WMemEDI:
            begin
              { build a reference that uses edi as both base and index and }
              { test the write against it                                  }
              fillchar(tmpref,sizeof(tmpref),0);
              tmpRef.base := R_EDI;
              tmpRef.index := R_EDI;
              for regCounter := R_EAX to R_EDI do
                if writeToMemDestroysContents(R_NO,tmpRef,regCounter,c[regCounter]) then
                  begin
                    exclude(regsStillValid,regCounter);
                    modifiesConflictingMemLocation := not(reg in regsStillValid);
                  end;
            end;
        end;
  end;
end;
|
|
|
|
function getPrevSequence(p: pai; reg: tregister; currentPrev: pai; var newPrev: pai;
  var passedJump: boolean; var regsNotRead, regsStillValid: tregset): tregister;
{ Walks backwards from currentPrev looking for an instruction at which the   }
{ startmod/nrOfMods info of some register differs from that at currentPrev   }
{ and that register holds a con_ref/con_noRemoveRef value.                   }
{ Returns that register (R_NO if none is found); when a register is found    }
{ by walking back, newPrev receives the instruction where it was found.      }
{ The function keeps state between calls in current_reg: as long as          }
{ current_reg is neither R_NO nor R_EDI, the next call first continues       }
{ scanning the remaining registers at currentPrev itself.                    }
{ passedJump, regsNotRead and regsStillValid are updated while walking.      }

const
  { last register returned by findChangedRegister; persists across calls }
  current_reg: tregister = R_NO;

  function stillValid(instr: pai): boolean;
  { true if instr is a non-jmp instruction at which reg has the same write }
  { state and content type as at currentPrev and reg is still in both      }
  { regsNotRead and regsStillValid. Also updates passedJump as side effect }
  begin
    stillValid :=
      (instr^.typ = ait_instruction) and
      (paicpu(instr)^.opcode <> a_jmp) and
      (ppaiprop(instr^.optinfo)^.regs[reg].wstate =
         ppaiprop(currentPrev^.optinfo)^.regs[reg].wstate) and
      { in case destroyreg is called with doIncState = false }
      (ppaiprop(instr^.optinfo)^.regs[reg].typ =
         ppaiprop(currentPrev^.optinfo)^.regs[reg].typ) and
      (reg in (regsNotRead * regsStillValid));
    passedJump :=
      (instr^.typ = ait_instruction) and
      (paicpu(instr)^.is_jmp);
  end;

  function findChangedRegister(instr: pai): tregister;
  { returns the first register after current_reg (up to R_EDI) whose      }
  { startmod or nrOfMods at instr differs from currentPrev and whose type }
  { at instr is con_ref/con_noRemoveRef; remembers it in current_reg.     }
  { Resets current_reg to R_NO and returns R_NO if there is none.         }
  var
    r: tregister;
  begin
    for r := succ(current_reg) to R_EDI do
      with ppaiprop(instr^.optinfo)^.regs[r] do
        if ((startmod <>
              ppaiprop(currentPrev^.optinfo)^.regs[r].startmod) or
            (nrOfMods <>
              ppaiprop(currentPrev^.optinfo)^.regs[r].nrOfMods)) and
           (ppaiprop(instr^.optinfo)^.regs[r].typ in
              [con_ref,con_noRemoveRef]) then
          begin
            findChangedRegister := r;
            current_reg := r;
            exit;
          end;
    current_reg := R_NO;
    findChangedRegister := R_NO;
  end;

var
  scan, lastVisited: pai;
  changedReg, r: tregister;
begin
  { continue an unfinished scan of the registers at currentPrev first }
  if not(current_reg in [R_NO,R_EDI]) then
    begin
      changedReg := findChangedRegister(currentPrev);
      if changedReg <> R_NO then
        begin
          getPrevSequence := changedReg;
          exit;
        end;
    end;

  getPrevSequence := R_NO;
  passedJump := passedJump or
    ((currentPrev^.typ = ait_instruction) and
     (paicpu(currentPrev)^.is_jmp));

  if (passedJump and not(reg in (usableregs+[R_EDI]))) or
     not getLastInstruction(currentPrev,scan) then
    exit;

  lastVisited := currentPrev;
  changedReg := R_NO;

  while (changedReg = R_NO) and
        stillValid(scan) and
        not(modifiesConflictingMemLocation(lastVisited,reg,
              ppaiprop(p^.optinfo)^.regs,regsStillValid)) do
    begin
      { only update the regsread for the instructions we already passed }
      if not(ppaiprop(lastVisited^.optinfo)^.canBeRemoved) then
        for r := R_EAX to R_EDI do
          if regReadByInstruction(r,lastVisited) then
            exclude(regsNotRead,r);

      { remember the current position, in case fetching the previous }
      { instruction below fails and sets scan to nil                 }
      lastVisited := scan;
      if not(ppaiprop(scan^.optinfo)^.canBeRemoved) then
        changedReg := findChangedRegister(scan);
      { do not load the self pointer or a regvar before a (conditional) }
      { jump with a new value, since if the jump is taken, the old      }
      { value is (probably) still necessary                             }
      if (passedJump and not(reg in (usableregs+[R_EDI]))) or
         not getLastInstruction(scan,scan) then
        break;
    end;

  getPrevSequence := changedReg;
  if changedReg <> R_NO then
    newPrev := lastVisited;
end;
|
|
|
|
|
|
function isSimpleMemLoc(const ref: treference): boolean;
{ A reference counts as "simple" when it has no index register and either }
{ its base is not one of usableregs+[R_EDI], or it is a plain symbol      }
{ reference without a base register.                                      }
begin
  if ref.index <> R_NO then
    isSimpleMemLoc := false
  else if not(ref.base in (usableregs+[R_EDI])) then
    isSimpleMemLoc := true
  else
    { index is known to be R_NO at this point }
    isSimpleMemLoc := assigned(ref.symbol) and (ref.base = R_NO);
end;
|
|
|
|
|
|
{ Checks whether the current instruction sequence (starting with p) and the
  one between StartMod and EndMod of Reg are the same. If so, the number of
  instructions that match is stored in Found and true is returned, otherwise
  Found holds the number of instructions between StartMod and EndMod and false
  is returned.

  All registers holding a con_ref/con_noRemoveRef value at the instruction
  before p are tried as candidates; if findPrevSeqs is set, earlier sequences
  located through getPrevSequence are tried afterwards as well. The longest
  match wins. On return prev is the instruction the chosen sequence was found
  at and RegInfo the register mapping collected for it. }
Function CheckSequence(p: Pai; var prev: pai; Reg: TRegister; Var Found: Longint;
           Var RegInfo: TRegInfo; findPrevSeqs: boolean): Boolean;

const
  { true once all registers at prev have been tried and the search has }
  { moved on to previous sequences; reset on every CheckSequence call  }
  checkingPrevSequences: boolean = false;
var
  regsNotRead, regsStillValid: tregset;

  function getNextRegToTest(var prev: pai; currentReg: tregister): tregister;
  { returns the next candidate register after currentReg, or R_NO when }
  { there are no candidates left                                       }
  const
    passedJump: boolean = false;
  begin
    if not checkingPrevSequences then
      begin
        Repeat
          Inc(currentReg);
        Until (currentReg > R_EDI) or
              (ppaiprop(prev^.optInfo)^.regs[currentReg].typ
                 in [con_ref,con_noRemoveRef]);
        if currentReg > R_EDI then
          begin
            { all registers done: switch to previous sequences, but only }
            { if p does not load from a non-simple memory location       }
            if (paicpu(p)^.oper[0].typ <> top_ref) or
               isSimpleMemLoc(paicpu(p)^.oper[0].ref^) then
              begin
                checkingPrevSequences := true;
                passedJump := false;
              end
            else
              getNextRegToTest := R_NO;
          end
        else getNextRegToTest := currentReg;
      end;
    if checkingPrevSequences then
      if findPrevSeqs then
        getNextRegToTest :=
          getPrevSequence(p,reg,prev,prev,passedJump,regsNotRead,RegsStillValid)
      else
        getNextRegToTest := R_NO;
  end;

Var hp2, hp3{, EndMod},highPrev, orgPrev: Pai;
    {Cnt,} OldNrOfMods: Longint;
    startRegInfo, OrgRegInfo, HighRegInfo: TRegInfo;
    regModified: array[R_NO..R_EDI] of boolean;
    HighFound, OrgRegFound: Byte;
    RegCounter, regCounter2, tmpreg: TRegister;
    OrgRegResult: Boolean;
    TmpResult: Boolean;
    {TmpState: Byte;}
Begin {CheckSequence}
  Reg := Reg32(Reg);
  TmpResult := False;
  FillChar(OrgRegInfo, SizeOf(OrgRegInfo), 0);
  FillChar(startRegInfo, sizeof(startRegInfo), 0);
  OrgRegFound := 0;
  HighFound := 0;
  OrgRegResult := False;
  { the frame pointer and stack pointer always map onto themselves }
  with startRegInfo do
    begin
      newRegsEncountered := [procinfo^.FramePointer, stack_pointer];
      new2OldReg[procinfo^.FramePointer] := procinfo^.FramePointer;
      new2OldReg[stack_pointer] := stack_pointer;
      oldRegsEncountered := newRegsEncountered;
    end;

  checkingPrevSequences := false;
  regsNotRead := [R_EAX,R_EBX,R_ECX,R_EDX,R_ESP,R_EBP,R_EDI,R_ESI];
  regsStillValid := regsNotRead;
  GetLastInstruction(p, prev);
  { make sure prev gets a defined value at the end even if no candidate }
  { matches and Reg itself is never tested (these two used to be read   }
  { uninitialised in that case)                                         }
  highPrev := prev;
  orgPrev := prev;
  regCounter := getNextRegToTest(prev,R_NO);
  While (RegCounter <> R_NO) Do
    Begin
      fillchar(regModified,sizeof(regModified),0);
      regInfo := startRegInfo;
      Found := 0;
      hp2 := PPaiProp(prev^.OptInfo)^.Regs[RegCounter].StartMod;
      If (prev <> PPaiProp(prev^.OptInfo)^.Regs[RegCounter].StartMod)
        Then OldNrOfMods := PPaiProp(prev^.OptInfo)^.Regs[RegCounter].NrOfMods
        Else OldNrOfMods := 1;
      hp3 := p;
      { compare the old sequence (hp2) with the new one (hp3) }
      While (Found <> OldNrOfMods) And
                                  { old  new }
             InstructionsEquivalent(hp2, hp3, RegInfo) Do
        Begin
          if (hp3^.typ = ait_instruction) and
             ((paicpu(hp3)^.opcode = A_MOV) or
              (paicpu(hp3)^.opcode = A_MOVZX) or
              (paicpu(hp3)^.opcode = A_MOVSX)) and
             (paicpu(hp3)^.oper[1].typ = top_reg) and
             not(regInOp(paicpu(hp3)^.oper[1].reg,
                   paicpu(hp3)^.oper[0])) then
            begin
              tmpreg := reg32(paicpu(hp3)^.oper[1].reg);
              regInfo.lastReload[tmpreg] := hp3;
              { if the source of this load uses a register that was      }
              { modified earlier in the sequence, extend the number of   }
              { instructions to compare so tmpreg's whole modification   }
              { sequence is covered                                      }
              case paicpu(hp3)^.oper[0].typ of
                top_ref:
                  begin
                    if regModified[reg32(paicpu(hp3)^.oper[0].ref^.base)] then
                      with ppaiprop(hp3^.optinfo)^.regs[tmpreg] do
                        if nrOfMods > (oldNrOfMods - found) then
                          oldNrOfMods := found + nrOfMods;
                    if regModified[reg32(paicpu(hp3)^.oper[0].ref^.index)] then
                      with ppaiprop(hp3^.optinfo)^.regs[tmpreg] do
                        if nrOfMods > (oldNrOfMods - found) then
                          oldNrOfMods := found + nrOfMods;
                  end;
                top_reg:
                  if regModified[reg32(paicpu(hp3)^.oper[0].reg)] then
                    with ppaiprop(hp3^.optinfo)^.regs[tmpreg] do
                      if nrOfMods > (oldNrOfMods - found) then
                        oldNrOfMods := found + nrOfMods;
              end;
            end;
          for regCounter2 := R_EAX to R_EDI do
            regModified[regCounter2] := regModified[regCounter2] or
              regModifiedByInstruction(regCounter2,hp3);
          GetNextInstruction(hp2, hp2);
          GetNextInstruction(hp3, hp3);
          Inc(Found)
        End;

      { hp3 is nil when the new sequence ran up to the end of the list;  }
      { the check further down already guards against that, this loop    }
      { did not and would dereference nil                                }
      if assigned(hp3) then
        for regCounter2 := R_EAX to R_EDI do
          if (regInfo.new2OldReg[regCounter2] <> R_NO) and
             (regCounter2 in PPaiProp(hp3^.optInfo)^.usedRegs) and
             not regLoadedWithNewValue(regCounter2,false,hp3) then
            include(regInfo.regsStillUsedAfterSeq,regCounter2);

      { when matching against a previous sequence, reject the match if a }
      { renamed register has been read or invalidated in between         }
      if checkingPrevSequences then
        for regCounter2 := R_EAX to R_EDI do
          if not(regInfo.new2OldReg[regCounter2] in [R_NO,regCounter2]) and
             (not(regCounter2 in (regsNotRead * regsStillValid)) or
              not(regInfo.new2OldReg[regCounter2] in regsStillValid)) then
            begin
              found := 0;
              break;
            end;

      If (Found <> OldNrOfMods) or
 { the following is to avoid problems with rangecheck code (see testcse2) }
         (assigned(hp3) and
          ((reg in regInfo.regsLoadedForRef) and
           (reg in PPaiProp(hp3^.optInfo)^.usedRegs) and
           not regLoadedWithNewValue(reg,false,hp3))) then
        Begin
          TmpResult := False;
          If (found > 0) then
{this is correct because we only need to turn off the CanBeRemoved flag
 when an instruction has already been processed by CheckSequence
 (otherwise CanBeRemoved can't be true and thus can't have to be turned off).
 If it has already been processed by CheckSequence and flagged to be
 removed, it means that it has been checked against a previous sequence
 and that it was equal (otherwise CheckSequence would have returned false
 and the instruction wouldn't have been removed). If this "If found > 0"
 check is left out, incorrect optimizations are performed.}
            Found := PPaiProp(Pai(p)^.OptInfo)^.Regs[Reg].NrOfMods
        End
      Else TmpResult := True;
      { remember the longest match seen so far ... }
      If TmpResult And
         (Found > HighFound)
        Then
          Begin
            highPrev := prev;
            HighFound := Found;
            HighRegInfo := RegInfo;
          End;
      { ... and separately the outcome for Reg itself }
      If (RegCounter = Reg) Then
        Begin
          orgPrev := prev;
          OrgRegFound := Found;
          OrgRegResult := TmpResult;
          OrgRegInfo := RegInfo
        End;
      regCounter := getNextRegToTest(prev,regCounter);
    End;
  { prefer the longest match unless Reg itself matched at least as long }
  If (HighFound > 0) And
     (Not(OrgRegResult) Or
      (HighFound > OrgRegFound))
    Then
      Begin
{$ifndef fpc}
        TmpResult := True;
{$else fpc}
        CheckSequence := True;
{$endif fpc}
        prev := highPrev;
        RegInfo := HighRegInfo;
        Found := HighFound
      End
    Else
      Begin
{$ifndef fpc}
        TmpResult := OrgRegResult;
{$else fpc}
        CheckSequence := OrgRegResult;
{$endif fpc}
        prev := orgPrev;
        Found := OrgRegFound;
        RegInfo := OrgRegInfo;
      End;
{$ifndef fpc}
  CheckSequence := TmpResult;
{$endif fpc}
End; {CheckSequence}
|
|
|
|
Procedure SetAlignReg(p: Pai);
{ Chooses the register stored in the alignment entry p (pai_align(p)^.reg). }
{ Up to alignSearch instructions before and after p are examined; a        }
{ register is dropped from the candidate set when its write state changes  }
{ before p, or its read or write state changes after p. If candidates      }
{ remain, the first one (in register order) is chosen, otherwise the       }
{ register that was dropped last.                                          }
Const
  alignSearch = 12;
var
  regsUsable: TRegSet;
  prevInstrCount, nextInstrCount: Longint;
  prevState, nextWState, nextRState: Array[R_EAX..R_EDI] of byte;
  r, lastRemoved: TRegister;
  prev, next: Pai;
{$ifdef alignregdebug}
  temp: Pai;
{$endif alignregdebug}
begin
  regsUsable := [R_EAX,R_ECX,R_EDX,R_EBX,{R_ESP,R_EBP,}R_ESI,R_EDI];
  { start from the register states recorded at p itself }
  for r := R_EAX to R_EDI do
    begin
      prevState[r] := PPaiProp(p^.optInfo)^.Regs[r].wState;
      nextWState[r] := PPaiProp(p^.optInfo)^.Regs[r].wState;
      nextRState[r] := PPaiProp(p^.optInfo)^.Regs[r].rState;
    end;
  getLastInstruction(p,prev);
  getNextInstruction(p,next);
  lastRemoved := pai_align(p)^.reg;
  nextInstrCount := 0;
  prevInstrCount := 0;
  while ((assigned(prev) and
          assigned(prev^.optInfo) and
          (prevInstrCount < alignSearch)) or
         (assigned(next) and
          assigned(next^.optInfo) and
          (nextInstrCount < alignSearch))) And
        (regsUsable <> []) do
    begin
{$ifdef alignregdebug}
      if assigned(prev) then
        begin
          temp := new(pai_asm_comment,init(strpnew('got here')));
          temp^.next := prev^.next;
          temp^.previous := prev;
          prev^.next := temp;
          if assigned(temp^.next) then
            temp^.next^.previous := temp;
        end;
{$endif alignregdebug}
      { ---- one step backwards ---- }
      if assigned(prev) and assigned(prev^.optinfo) and
         (prevInstrCount < alignSearch) then
        begin
          if (prev^.typ = ait_instruction) And
             (insProp[PaiCpu(prev)^.opcode].ch[1] <> Ch_ALL) and
             (PaiCpu(prev)^.opcode <> A_JMP) then
            begin
              inc(prevInstrCount);
              for r := R_EAX to R_EDI do
                begin
                  if (r in regsUsable) And
                     (PPaiProp(prev^.optInfo)^.Regs[r].wState <>
                        prevState[r]) then
                    begin
                      lastRemoved := r;
                      exclude(regsUsable,r);
{$ifdef alignregdebug}
                      temp := new(pai_asm_comment,init(strpnew(
                                att_reg2str[r]+' removed')));
                      temp^.next := prev^.next;
                      temp^.previous := prev;
                      prev^.next := temp;
                      if assigned(temp^.next) then
                        temp^.next^.previous := temp;
                      if regsUsable = [] then
                        begin
                          temp := new(pai_asm_comment,init(strpnew(
                                    'regsUsable empty here')));
                          temp^.next := prev^.next;
                          temp^.previous := prev;
                          prev^.next := temp;
                          if assigned(temp^.next) then
                            temp^.next^.previous := temp;
                        end;
{$endif alignregdebug}
                    end;
                  prevState[r] :=
                    PPaiProp(prev^.optInfo)^.Regs[r].wState;
                end;
              getLastInstruction(prev,prev);
            end
          else
            { not a countable instruction: skip it and resynchronise the }
            { reference write states                                     }
            If GetLastInstruction(prev,prev) and
               assigned(prev^.optinfo) then
              for r := R_EAX to R_EDI do
                prevState[r] :=
                  PPaiProp(prev^.optInfo)^.Regs[r].wState
        end;
      { ---- one step forwards ---- }
      if assigned(next) and assigned(next^.optInfo) and
         (nextInstrCount < alignSearch) then
        begin
          if (next^.typ = ait_instruction) and
             (insProp[PaiCpu(next)^.opcode].ch[1] <> Ch_ALL) and
             (PaiCpu(next)^.opcode <> A_JMP) then
            begin
              inc(nextInstrCount);
              for r := R_EAX to R_EDI do
                begin
                  if (r in regsUsable) And
                     ((PPaiProp(next^.optInfo)^.Regs[r].wState <>
                         nextWState[r]) or
                      (PPaiProp(next^.optInfo)^.Regs[r].rState <>
                         nextRState[r])) Then
                    begin
                      lastRemoved := r;
                      exclude(regsUsable,r);
{$ifdef alignregdebug}
                      temp := new(pai_asm_comment,init(strpnew(
                                att_reg2str[r]+' removed')));
                      temp^.next := next^.next;
                      temp^.previous := next;
                      next^.next := temp;
                      if assigned(temp^.next) then
                        temp^.next^.previous := temp;
                      if regsUsable = [] then
                        begin
                          temp := new(pai_asm_comment,init(strpnew(
                                    'regsUsable empty here')));
                          temp^.next := next^.next;
                          temp^.previous := next;
                          next^.next := temp;
                          if assigned(temp^.next) then
                            temp^.next^.previous := temp;
                        end;
{$endif alignregdebug}
                    end;
                  nextWState[r] :=
                    PPaiProp(next^.optInfo)^.Regs[r].wState;
                  nextRState[r] :=
                    PPaiProp(next^.optInfo)^.Regs[r].rState;
                end
            end
          else
            { not a countable instruction: just resynchronise the states }
            for r := R_EAX to R_EDI do
              begin
                nextWState[r] :=
                  PPaiProp(next^.optInfo)^.Regs[r].wState;
                nextRState[r] :=
                  PPaiProp(next^.optInfo)^.Regs[r].rState;
              end;
          getNextInstruction(next,next);
        end;
    end;
  { prefer a register that survived the whole search }
  if regsUsable <> [] then
    for r := R_EAX to R_EDI do
      if r in regsUsable then
        begin
          lastRemoved := r;
          break
        end;
{$ifdef alignregdebug}
  next := new(pai_asm_comment,init(strpnew(att_reg2str[lastRemoved]+
            ' chosen as alignment register')));
  next^.next := p^.next;
  next^.previous := p;
  p^.next := next;
  if assigned(next^.next) then
    next^.next^.previous := next;
{$endif alignregdebug}
  pai_align(p)^.reg := lastRemoved;
End;
|
|
|
|
Procedure RestoreRegContentsTo(reg: TRegister; const c: TContent; p, endP: pai);
{ Sets the recorded contents of reg to c in the optimizer info of every   }
{ instruction from p up to (not including) endP, and then from endP on    }
{ until the end of the list or the first instruction at which the write   }
{ state of reg differs from the one it has at endP.                       }
var
{$ifdef replaceregdebug}
  hp: pai;
  l: longint;
{$endif replaceregdebug}
  wStateAtEnd: byte;
begin
{$ifdef replaceregdebug}
  { mark the start of the restored range with an assembler comment }
  l := random(1000);
  hp := new(pai_asm_comment,init(strpnew(
          'restored '+att_reg2str[reg]+' with data from here... '+tostr(l))));
  hp^.next := p;
  hp^.previous := p^.previous;
  p^.previous := hp;
  if assigned(hp^.previous) then
    hp^.previous^.next := hp;
{$endif replaceregdebug}
  { first part: everything before endP }
  While (p <> endP) Do
    Begin
      PPaiProp(p^.optInfo)^.Regs[reg] := c;
      getNextInstruction(p,p);
    end;
  { second part: from endP on, as long as the write state stays the same }
  wStateAtEnd := PPaiProp(p^.optInfo)^.Regs[reg].wState;
  repeat
    PPaiProp(p^.optInfo)^.Regs[reg] := c;
    if not getNextInstruction(p,p) then
      break;
  until PPaiProp(p^.optInfo)^.Regs[reg].wState <> wStateAtEnd;
{$ifdef replaceregdebug}
  if assigned(p) then
    begin
      hp := new(pai_asm_comment,init(strpnew(
              'restored '+att_reg2str[reg]+' till here... '+tostr(l))));
      hp^.next := p;
      hp^.previous := p^.previous;
      p^.previous := hp;
      if assigned(hp^.previous) then
        hp^.previous^.next := hp;
    end;
{$endif replaceregdebug}
end;
|
|
|
|
|
|
Procedure ClearRegContentsFrom(reg: TRegister; p, endP: pai);
{ Marks the contents of reg as con_unknown from p till endP. After that,  }
{ the contents keep being cleared until the end of the list or the first  }
{ instruction at which the startmod recorded for reg differs from the one }
{ recorded at endP.                                                       }
var
{$ifdef replaceregdebug}
  hp: pai;
  l: longint;
{$endif replaceregdebug}
  startmodAtEnd: pai;
begin
{$ifdef replaceregdebug}
  { mark the start of the cleared range with an assembler comment }
  l := random(1000);
  hp := new(pai_asm_comment,init(strpnew(
          'cleared '+att_reg2str[reg]+' from here... '+tostr(l))));
  hp^.next := p;
  hp^.previous := p^.previous;
  p^.previous := hp;
  if assigned(hp^.previous) then
    hp^.previous^.next := hp;
{$endif replaceregdebug}
  PPaiProp(p^.optInfo)^.Regs[reg].typ := con_unknown;
  { first part: everything before endP }
  While (p <> endP) Do
    Begin
      PPaiProp(p^.optInfo)^.Regs[reg].typ := con_unknown;
      getNextInstruction(p,p);
    end;
  { second part: from endP on, as long as startmod stays the same }
  startmodAtEnd := PPaiProp(p^.optInfo)^.Regs[reg].startmod;
  repeat
    PPaiProp(p^.optInfo)^.Regs[reg].typ := con_unknown;
    if not getNextInstruction(p,p) then
      break;
  until PPaiProp(p^.optInfo)^.Regs[reg].startmod <> startmodAtEnd;
{$ifdef replaceregdebug}
  if assigned(p) then
    begin
      hp := new(pai_asm_comment,init(strpnew(
              'cleared '+att_reg2str[reg]+' till here... '+tostr(l))));
      hp^.next := p;
      hp^.previous := p^.previous;
      p^.previous := hp;
      if assigned(hp^.previous) then
        hp^.previous^.next := hp;
    end;
{$endif replaceregdebug}
end;
|
|
|
|
function NoHardCodedRegs(p: paicpu; orgReg, newReg: TRegister): boolean;
{ Returns true if instruction p has no implicit (hard coded) register     }
{ operands that would get in the way of exchanging orgReg and newReg.     }
{   - imul: only the one-operand form is rejected                         }
{   - shifts/rotates: a register count operand is always %cl, so they are }
{     rejected when the count is a register and orgReg or newReg is ecx   }
{   - everything else: rejected when the instruction property table lists }
{     a hard coded register (other than esp), a write to memory at edi,   }
{     or Ch_All                                                           }
var chCount: byte;
begin
  case p^.opcode of
    A_IMUL: noHardCodedRegs := p^.ops <> 1;
    { sal/sar and the rotates take their variable count in %cl exactly }
    { like shl/shr, so they need the same treatment                    }
    A_SHL,A_SHR,A_SAL,A_SAR,A_SHLD,A_SHRD,
    A_ROL,A_ROR,A_RCL,A_RCR: noHardCodedRegs :=
      (p^.oper[0].typ <> top_reg) or
      ((orgReg <> R_ECX) and (newReg <> R_ECX));
    else
      begin
        NoHardCodedRegs := true;
        with InsProp[p^.opcode] do
          for chCount := 1 to MaxCh do
            if Ch[chCount] in ([Ch_REAX..Ch_MEDI,Ch_WMemEDI,Ch_All]-[Ch_RESP,Ch_WESP,Ch_RWESP]) then
              begin
                NoHardCodedRegs := false;
                break
              end;
      end;
  end;
end;
|
|
|
|
function ChangeReg(var Reg: TRegister; newReg, orgReg: TRegister): boolean;
{ If Reg is newReg, or the result of regtoreg8/regtoreg16 applied to      }
{ newReg, it is replaced by the corresponding form of orgReg and true is  }
{ returned. Otherwise Reg is left alone and false is returned.            }
begin
  if reg = newReg then
    begin
      reg := orgReg;
      changeReg := true;
    end
  else if reg = regtoreg8(newReg) then
    begin
      reg := regtoreg8(orgReg);
      changeReg := true;
    end
  else if reg = regtoreg16(newReg) then
    begin
      reg := regtoreg16(orgReg);
      changeReg := true;
    end
  else
    changeReg := false;
end;
|
|
|
|
function changeOp(var o: toper; newReg, orgReg: tregister): boolean;
{ Replaces newReg by orgReg in operand o (see ChangeReg).                  }
{   top_reg: the register itself is replaced                               }
{   top_ref: both the base and the index register are replaced             }
{   other operand types are left untouched                                 }
{ Returns true if anything was replaced, false otherwise.                  }
var
  baseChanged, indexChanged: boolean;
begin
  { defined result for operand types not handled below }
  changeOp := false;
  case o.typ of
    top_reg: changeOp := changeReg(o.reg,newReg,orgReg);
    top_ref:
      begin
        { evaluate both calls separately: with short-circuit boolean   }
        { evaluation "a or b" would skip the index register whenever   }
        { the base register had been replaced                          }
        baseChanged := changeReg(o.ref^.base,newReg,orgReg);
        indexChanged := changeReg(o.ref^.index,newReg,orgReg);
        changeOp := baseChanged or indexChanged;
      end;
  end;
end;
|
|
|
|
procedure updateStates(orgReg,newReg: tregister; hp: pai; writeStateToo: boolean);
{ Recomputes the read state (and, if writeStateToo is set, the write      }
{ state) of orgReg at hp. If hp has a predecessor, the new state is the   }
{ state of orgReg at the predecessor plus the amount by which the state   }
{ of newReg changed between the predecessor and hp. Without a             }
{ predecessor, the state of newReg at hp is copied.                       }
var
  prev: pai;
  rStateForOrg, wStateForOrg: byte;
begin
  if getLastInstruction(hp,prev) then
    begin
      rStateForOrg := ppaiprop(prev^.optinfo)^.regs[orgReg].rState +
        ppaiprop(hp^.optinfo)^.regs[newReg].rState -
        ppaiprop(prev^.optinfo)^.regs[newReg].rState;
      if writeStateToo then
        wStateForOrg := ppaiprop(prev^.optinfo)^.regs[orgReg].wState +
          ppaiprop(hp^.optinfo)^.regs[newReg].wState -
          ppaiprop(prev^.optinfo)^.regs[newReg].wState;
    end
  else
    begin
      rStateForOrg := ppaiprop(hp^.optinfo)^.regs[newReg].rState;
      if writeStateToo then
        wStateForOrg := ppaiprop(hp^.optinfo)^.regs[newReg].wState;
    end;
  ppaiprop(hp^.optinfo)^.regs[orgReg].rState := rStateForOrg;
  if writeStateToo then
    ppaiprop(hp^.optinfo)^.regs[orgReg].wState := wStateForOrg;
end;
|
|
|
|
function doReplaceReg(hp: paicpu; newReg, orgReg: tregister): boolean;
{ Replaces newReg by orgReg in all operands of instruction hp (see        }
{ changeOp). Returns true if at least one operand was changed, false      }
{ otherwise (also when hp has no operands).                               }
var
  opCount: longint;
  tmpResult: boolean;
begin
  { tmpResult is or-ed into itself below, so it needs a defined start }
  { value; it used to be read uninitialised                            }
  tmpResult := false;
  for opCount := 0 to hp^.ops-1 do
    { changeOp comes first so it is called for every operand, even }
    { after an earlier operand has already been changed            }
    tmpResult :=
      changeOp(hp^.oper[opCount],newReg,orgReg) or tmpResult;
  doReplaceReg := tmpResult;
end;
|
|
|
|
function RegSizesOK(oldReg,newReg: TRegister; p: paicpu): boolean;
{ oldreg and newreg must be 32bit components                              }
{ Returns false only if exactly one of oldReg/newReg satisfies IsGP32reg  }
{ and one of the first three operands of p is a register in R_AL..R_DH.   }
var
  i: byte;
begin
  RegSizesOK := true;
  { nothing to check if both or neither are general purpose registers }
  if not(IsGP32reg(oldReg) xor IsGP32Reg(newReg)) then
    exit;
  for i := 0 to 2 do
    if (p^.oper[i].typ = top_reg) and
       (p^.oper[i].reg in [R_AL..R_DH]) then
      begin
        RegSizesOK := false;
        break
      end;
end;
|
|
|
|
function doReplaceReadReg(p: paicpu; newReg,orgReg: tregister): boolean;
{ Replaces newReg by orgReg in the operands of p that are read:           }
{   - imul with 2 or 3 operands: the first operand, plus the second one   }
{     for the 3-operand form                                              }
{   - any other supported instruction: every memory reference operand,    }
{     plus every register operand flagged as read-only (Ch_ROp1..3) in    }
{     the instruction property table                                      }
{ One-operand imul and div/idiv/mul are not supported and raise an        }
{ internal error. Returns true if anything was replaced.                  }
var
  i: byte;
begin
  doReplaceReadReg := false;
  case p^.opcode of
    { special case: operands that are read depend on the operand count }
    A_IMUL:
      case p^.ops of
        1: internalerror(1301001);
        2,3:
          begin
            if changeOp(p^.oper[0],newReg,orgReg) then
              doReplaceReadReg := true;
            if p^.ops = 3 then
              if changeOp(p^.oper[1],newReg,orgReg) then
                doReplaceReadReg := true;
          end;
      end;
    A_DIV,A_IDIV,A_MUL: internalerror(1301002);
    else
      begin
        { registers used inside a memory reference are always read }
        for i := 0 to 2 do
          if p^.oper[i].typ = top_ref then
            if changeOp(p^.oper[i],newReg,orgReg) then
              doReplaceReadReg := true;
        { register operands: only those the instruction merely reads }
        for i := 1 to MaxCh do
          case InsProp[p^.opcode].Ch[i] of
            Ch_ROp1:
              if p^.oper[0].typ = top_reg then
                if changeReg(p^.oper[0].reg,newReg,orgReg) then
                  doReplaceReadReg := true;
            Ch_ROp2:
              if p^.oper[1].typ = top_reg then
                if changeReg(p^.oper[1].reg,newReg,orgReg) then
                  doReplaceReadReg := true;
            Ch_ROp3:
              if p^.oper[2].typ = top_reg then
                if changeReg(p^.oper[2].reg,newReg,orgReg) then
                  doReplaceReadReg := true;
          end;
      end;
  end;
end;
|
|
|
|
|
|
procedure updateState(reg: tregister; p: pai);
{ Propagates the read and write state of reg at p to the instructions     }
{ following p. It's called when the read/write state of p has been        }
{ changed and this change has to be carried over to the following         }
{ instructions as well. Propagation of each state stops at the first      }
{ instruction where the old value of that state changes.                  }
var
  rStateToSet, wStateToSet: byte;
  oldRState, oldWState: byte;
  updateR, updateW: boolean;
begin
  { the new states are taken from p }
  rStateToSet := ppaiprop(p^.optinfo)^.regs[reg].rState;
  wStateToSet := ppaiprop(p^.optinfo)^.regs[reg].wState;
  if not GetNextInstruction(p,p) then
    exit;
  { the old states of the next instruction tell us when to stop }
  oldRState := ppaiprop(p^.optinfo)^.regs[reg].rState;
  oldWState := ppaiprop(p^.optinfo)^.regs[reg].wState;
  { adjust the states if this next instruction reads/writes the register }
  if regReadByInstruction(reg,p) then
    incState(rStateToSet,1);
  if regModifiedByInstruction(reg,p) then
    incState(wStateToSet,1);
  updateR := true;
  updateW := true;
  repeat
    { write the states that still have to be updated }
    if updateR then
      ppaiprop(p^.optinfo)^.regs[reg].rState := rStateToSet;
    if updateW then
      ppaiprop(p^.optinfo)^.regs[reg].wState := wStateToSet;
    if not getNextInstruction(p,p) then
      break;
    { stop updating the read state once its old value changes }
    updateR := updateR and
      (ppaiprop(p^.optinfo)^.regs[reg].rState = oldRState);
    { if, by accident, this changed state is the same as the one we've }
    { been using, switch to a value that's definitely different from   }
    { the previous and next state and carry on                         }
    if not updateR and
       (ppaiprop(p^.optinfo)^.regs[reg].rState = rStateToSet) then
      begin
        incState(rStateToSet,1);
        oldRState := ppaiprop(p^.optinfo)^.regs[reg].rState;
        updateR := true;
      end;
    { ditto for the write state }
    updateW := updateW and
      (ppaiprop(p^.optinfo)^.regs[reg].wState = oldWState);
    if not updateW and
       (ppaiprop(p^.optinfo)^.regs[reg].wState = wStateToSet) then
      begin
        incState(wStateToSet,1);
        oldWState := ppaiprop(p^.optinfo)^.regs[reg].wState;
        updateW := true;
      end;
  { done when neither state has to be updated anymore }
  until (not updateR) and (not updateW);
end;
|
|
|
|
|
|
function storeBack(p1: pai; orgReg, newReg: tregister): boolean;
{ returns true if p1 is a "mov newReg,orgReg" instruction, i.e. one that }
{ stores the contents of newReg back to orgReg                           }
begin
  storeBack := false;
  if p1^.typ <> ait_instruction then
    exit;
  with paicpu(p1)^ do
    storeBack :=
      (opcode = A_MOV) and
      (oper[0].typ = top_reg) and
      (oper[0].reg = newReg) and
      (oper[1].typ = top_reg) and
      (oper[1].reg = orgReg);
end;
|
|
|
|
|
|
function ReplaceReg(asmL: PaasmOutput; orgReg, newReg: TRegister; p: pai;
           const c: TContent; orgRegCanBeModified: Boolean;
           var returnEndP: pai): Boolean;
{ Tries to replace newReg with orgReg in the instructions coming after p,  }
{ up to the instruction where newReg gets loaded with a new value or where }
{ newReg is deallocated. Returns true if successful, false otherwise.      }
{                                                                          }
{  c                   : the contents newReg had before the current        }
{                        sequence started; on success the contents of      }
{                        newReg are restored to c                          }
{  orgRegCanBeModified : if false, the replacement is refused when newReg  }
{                        is modified inside the sequence (unless the       }
{                        sequence ends by storing newReg back to orgReg)   }
{  returnEndP          : only set when the function returns true; it then  }
{                        holds the instruction at which replacing stopped  }
var endP, hp: Pai;
    removeLast, sequenceEnd, tmpResult, newRegModified, orgRegRead,
      stateChanged, readStateChanged: Boolean;

begin
  ReplaceReg := false;
  tmpResult := true;
  sequenceEnd := false;
  newRegModified := false;
  orgRegRead := false;
  removeLast := false;
  endP := p;
  { phase 1: scan forward to find the end of the sequence and check that }
  { every instruction on the way allows the replacement                  }
  while tmpResult and not sequenceEnd do
    begin
      tmpResult :=
        getNextInstruction(endP,endP) and
        (endP^.typ = ait_instruction);
      { instructions without optimizer info cannot be analysed: give up }
      if tmpresult and not assigned(endP^.optInfo) then
        begin
{          hp := new(pai_asm_comment,init(strpnew('next no optinfo')));
          hp^.next := endp;
          hp^.previous := endp^.previous;
          endp^.previous := hp;
          if assigned(hp^.previous) then
            hp^.previous^.next := hp;}
          exit;
        end;
      If tmpResult and
         { don't take into account instructions that will be removed }
         Not (PPaiProp(endP^.optInfo)^.canBeRemoved) then
        begin
          { if the newReg gets stored back to the oldReg, we can change }
          { "mov %oldReg,%newReg; <operations on %newReg>; mov %newReg, }
          { %oldReg" to "<operations on %oldReg>"                       }
          removeLast := storeBack(endP, orgReg, newReg);
          sequenceEnd :=
            { no support for (i)div, mul and imul with hardcoded operands }
            (noHardCodedRegs(paicpu(endP),orgReg,newReg) and
            { if newReg gets loaded with a new value, we can stop   }
            { replacing newReg with oldReg here (possibly keeping   }
            { the original contents of oldReg so we still know them }
            { afterwards)                                           }
             RegLoadedWithNewValue(newReg,true,paicpu(endP)) or
            { we can also stop if we reached the end of the use of }
            { newReg's current contents                            }
             (GetNextInstruction(endp,hp) and
              FindRegDealloc(newReg,hp)));
          { to be able to remove the first and last instruction of  }
          {   movl %reg1, %reg2                                     }
          {   <operations on %reg2> (replacing reg2 with reg1 here) }
          {   movl %reg2, %reg1                                     }
          { %reg2 must not be used afterwards (it can be as the     }
          { result of a peephole optimization)                      }
          removeLast := removeLast and sequenceEnd;
          newRegModified :=
            newRegModified or
            (not(regLoadedWithNewValue(newReg,true,paicpu(endP))) and
             RegModifiedByInstruction(newReg,endP));
          orgRegRead := newRegModified and RegReadByInstruction(orgReg,endP);
          sequenceEnd := SequenceEnd and
                         (removeLast  or
      { since newReg will be replaced by orgReg, we can't allow that newReg }
      { gets modified if orgReg is still read afterwards (since after       }
      { replacing, this would mean that orgReg first gets modified and then }
      { gets read in the assumption it still contains the unmodified value) }
                         not(newRegModified and orgRegRead)) (* and
      { since newReg will be replaced by orgReg, we can't allow that newReg }
      { gets modified if orgRegCanBeModified = false                        }

      { this now gets checked after the loop (JM) }
                         (orgRegCanBeModified or not(newRegModified)) *);
          tmpResult :=
            not(removeLast) and
            not(newRegModified and orgRegRead) and
(*            (orgRegCanBeModified or not(newRegModified)) and *)
            (endP^.typ = ait_instruction) and
            not(paicpu(endP)^.is_jmp) and
            NoHardCodedRegs(paicpu(endP),orgReg,newReg) and
            RegSizesOk(orgReg,newReg,paicpu(endP)) and
            not RegModifiedByInstruction(orgReg,endP);
        end;
    end;
  { final verdict: the orgRegCanBeModified restriction is checked here, }
  { together with the requirements on the last instruction itself       }
  sequenceEnd := sequenceEnd and
     (removeLast  or
      (orgRegCanBeModified or not(newRegModified))) and
     (not(assigned(endp)) or
      not(endp^.typ = ait_instruction) or
      (noHardCodedRegs(paicpu(endP),orgReg,newReg) and
       RegSizesOk(orgReg,newReg,paicpu(endP)) and
       not(newRegModified and
           (orgReg in PPaiProp(endP^.optInfo)^.usedRegs) and
           not(RegLoadedWithNewValue(orgReg,true,paicpu(endP))))));
  if SequenceEnd then
    begin
{$ifdef replaceregdebug}
      hp := new(pai_asm_comment,init(strpnew(
        'replacing '+att_reg2str[newreg]+' with '+att_reg2str[orgreg]+
        ' from here...')));
      hp^.next := p;
      hp^.previous := p^.previous;
      p^.previous := hp;
      if assigned(hp^.previous) then
        hp^.previous^.next := hp;

      hp := new(pai_asm_comment,init(strpnew(
        'replaced '+att_reg2str[newreg]+' with '+att_reg2str[orgreg]+
        ' till here')));
      hp^.next := endp^.next;
      hp^.previous := endp;
      endp^.next := hp;
      if assigned(hp^.next) then
        hp^.next^.previous := hp;
{$endif replaceregdebug}
      replaceReg := true;
      returnEndP := endP;

      { phase 2: perform the replacement in every instruction strictly }
      { between p and endP                                             }
      getNextInstruction(p,hp);
      stateChanged := false;
      { readStateChanged is only assigned below when endP is an          }
      { instruction; give it a defined value so the tests that follow    }
      { never read an uninitialized boolean                              }
      readStateChanged := false;
      while hp <> endP do
        begin
          if {not(PPaiProp(hp^.optInfo)^.canBeRemoved) and }
             (hp^.typ = ait_instruction) then
            stateChanged :=
              doReplaceReg(paicpu(hp),newReg,orgReg) or stateChanged;
          { once something has been replaced, the register states of all }
          { following instructions have to be kept in sync               }
          if stateChanged then
            updateStates(orgReg,newReg,hp,true);
          getNextInstruction(hp,hp)
        end;
      { in the last instruction only the operands that read newReg are }
      { replaced                                                       }
      if assigned(endp) and (endp^.typ = ait_instruction) then
        readStateChanged :=
          DoReplaceReadReg(paicpu(endP),newReg,orgReg);
      if stateChanged or readStateChanged then
        updateStates(orgReg,newReg,endP,stateChanged);

      if stateChanged or readStateChanged then
        updateState(orgReg,endP);

{ the replacing stops either at the moment that                             }
{  a) the newreg gets loaded with a new value (one not depending on the     }
{     current value of newreg)                                              }
{  b) newreg is completely replaced in this sequence and its current value  }
{     isn't used anymore                                                    }
{ In case b, the newreg was completely replaced by oldreg, so its contents  }
{ are unchanged compared to the start of this sequence, so restore them     }
      If removeLast or
         RegLoadedWithNewValue(newReg,true,endP) then
        GetLastInstruction(endP,hp)
      else hp := endP;
      if removeLast or
         (p <> endp) or
         not RegLoadedWithNewValue(newReg,true,endP) then
        RestoreRegContentsTo(newReg,c,p,hp);

{ In both case a and b, it is possible that the new register was modified   }
{ (e.g. an add/sub), so if it was replaced by oldreg in that instruction,   }
{ oldreg's contents have been changed. To take this into account, we simply }
{ set the contents of orgreg to "unknown" after this sequence               }
      if newRegModified then
        ClearRegContentsFrom(orgReg,p,hp);
      { the store back "mov newReg,orgReg" has become superfluous }
      if removeLast then
        ppaiprop(endP^.optinfo)^.canBeRemoved := true;
      allocRegBetween(asml,orgReg,p,endP);

    end
{$ifdef replaceregdebug}
  else
    begin
      hp := new(pai_asm_comment,init(strpnew(
        'replacing '+att_reg2str[newreg]+' with '+att_reg2str[orgreg]+
        ' from here...')));
      hp^.previous := p^.previous;
      hp^.next := p;
      p^.previous := hp;
      if assigned(hp^.previous) then
        hp^.previous^.next := hp;

      hp := new(pai_asm_comment,init(strpnew(
        'replacing '+att_reg2str[newreg]+' with '+att_reg2str[orgreg]+
        ' failed here')));
      hp^.next := endp^.next;
      hp^.previous := endp;
      endp^.next := hp;
      if assigned(hp^.next) then
        hp^.next^.previous := hp;
    end;
{$endif replaceregdebug}
End;
|
|
|
|
Function FindRegWithConst(p: Pai; size: topsize; l: longint; Var Res: TRegister): Boolean;
{ Scans the registers following R_NO up to and including R_EDI, using the  }
{ optimizer info attached to p, for one whose contents are a constant load }
{ of the value l done with operand size "size". Returns true if one is     }
{ found.                                                                   }
{ NOTE(review): Res receives the last register examined even when nothing  }
{ matched (R_EDI in that case), so callers must check the function result. }
{ NOTE(review): Res is the index used for the regs[] array; whether that   }
{ is the right register to use for sizes other than 32 bit should be       }
{ confirmed against the callers.                                           }
Var candidate: TRegister;
    loadInstr: paicpu;
{$ifdef testing}
    marker: pai;
{$endif testing}
    found: boolean;
Begin
  candidate := R_NO;
  repeat
    inc(candidate);
    found := false;
    if ppaiprop(p^.optInfo)^.regs[candidate].typ in
         [con_const,con_noRemoveConst] then
      begin
        { the instruction that loaded the constant into this register }
        loadInstr := paicpu(ppaiprop(p^.optInfo)^.regs[candidate].startMod);
        found :=
          (loadInstr^.opsize = size) and
          (loadInstr^.oper[0].typ = top_const) and
          (loadInstr^.oper[0].val = l);
{$ifdef testing}
        { mark every constant load that was examined in the output }
        marker := new(pai_asm_comment,init(strpnew(
          'checking const load of '+tostr(l)+' here...')));
        marker^.next := loadInstr;
        marker^.previous := loadInstr^.previous;
        loadInstr^.previous := marker;
        if assigned(marker^.previous) then
          marker^.previous^.next := marker;
{$endif testing}
      end;
  until found or (candidate = R_EDI);
  res := candidate;
  FindRegWithConst := found;
End;
|
|
|
|
procedure removePrevNotUsedLoad(p: pai; reg: tRegister; check: boolean);
{ Marks the previous load of reg as removable when the loaded value was    }
{ never read before p.                                                     }
{ If check = true, the procedure additionally has to make sure that the    }
{ contents cannot still be used after p (needed when removing instructions }
{ because of a "call"). With check = false this is not necessary (e.g.     }
{ when you have a "mov 8(%ebp),%eax", you can be sure the previous value   }
{ of %eax isn't used anymore later on).                                    }
var
  prevInstr: pai;
  removable: boolean;
begin
  if not getLastInstruction(p,prevInstr) then
    exit;
  with ppaiprop(prevInstr^.optInfo)^.regs[reg] do
    begin
      { only a single-instruction load whose read state did not change }
      { since it was executed (= the value was never read) qualifies   }
      if not(typ in [con_ref,con_invalid]) or
         (nrOfMods <> 1) or
         (rState <> ppaiprop(startmod^.optInfo)^.regs[reg].rState) then
        exit;
      removable := not(check);
      if not removable then
        begin
          { p itself doesn't use reg, and the value was loaded into a }
          { non-usable register from a stack pointer based reference  }
          removable :=
            not(regInInstruction(reg,p)) and
            (not(reg in usableregs) and
             (startmod^.typ = ait_instruction) and
             ((paicpu(startmod)^.opcode = A_MOV) or
              (paicpu(startmod)^.opcode = A_MOVZX) or
              (paicpu(startmod)^.opcode = A_MOVSX)) and
             (paicpu(startmod)^.oper[0].typ = top_ref) and
             (paicpu(startmod)^.oper[0].ref^.base = stack_pointer));
          { ... or reg isn't in use anymore / gets deallocated at p }
          if not removable then
            removable :=
              not(reg in ppaiprop(prevInstr^.optInfo)^.usedRegs) or
              findRegDealloc(reg,p);
        end;
      if removable then
        ppaiprop(startMod^.optInfo)^.canBeRemoved := true;
    end;
end;
|
|
|
|
|
|
procedure DoCSE(AsmL: PAasmOutput; First, Last: Pai; findPrevSeqs, doSubOpts: boolean);
{ Walks the instructions from First up to (not including) Last and marks    }
{ the ones that can be removed by RemoveInstructs. They're not removed      }
{ immediately because sometimes an instruction needs to be checked in two   }
{ different sequences.                                                      }
{                                                                           }
{  findPrevSeqs : passed on unchanged to CheckSequence                      }
{  doSubOpts    : if false and p starts the modification sequence of its    }
{                 destination register, the rest of that sequence is        }
{                 skipped after p has been handled (only whole blocks are   }
{                 tried, see the comment near the end of the mov case)      }
var cnt, cnt2, orgNrOfMods: longint;
    p, hp1, hp2, prevSeq, prevSeq_next: Pai;
    hp3, hp4: pai;
    hp5 : pai;
    RegInfo: TRegInfo;
    RegCounter: TRegister;
Begin
  p := First;
  SkipHead(p);
  While (p <> Last) Do
    Begin
      Case p^.typ Of
        ait_align:
          if not(pai_align(p)^.use_op) then
            SetAlignReg(p);
        ait_instruction:
          Begin
            Case Paicpu(p)^.opcode Of
              A_CALL:
                { try to get rid of loads before the call whose result }
                { is not used (check = true: verify this explicitly)   }
                for regCounter := R_EAX to R_EBX do
                  removePrevNotUsedLoad(p,regCounter,true);
              { a cld is superfluous if the direction flag state recorded }
              { at the previous instruction is already F_NotSet           }
              A_CLD: If GetLastInstruction(p, hp1) And
                        (PPaiProp(hp1^.OptInfo)^.DirFlag = F_NotSet) Then
                       PPaiProp(Pai(p)^.OptInfo)^.CanBeRemoved := True;
              A_MOV, A_MOVZX, A_MOVSX:
                Begin
                  { hp2 remembers the first instruction of the sequence, }
                  { p itself is advanced further down                    }
                  hp2 := p;
                  Case Paicpu(p)^.oper[0].typ Of
                    top_ref, top_reg:
                      if (paicpu(p)^.oper[1].typ = top_reg) then
                        Begin
                          With PPaiProp(p^.OptInfo)^.Regs[Reg32(Paicpu(p)^.oper[1].reg)] Do
                            Begin
                              { remember the length of the sequence that starts at p }
                              { (0 if p does not start one); used for the doSubOpts  }
                              { skipping at the end of this case                     }
                              if assigned(startmod) and
                                 (startmod = p)then
                                orgNrOfMods := ppaiprop(startmod^.optinfo)^.
                                  regs[reg32(paicpu(p)^.oper[1].reg)].nrOfMods
                              else
                                orgNrOfMods := 0;
                              If (p = StartMod) And
                                 GetLastInstruction (p, hp1) And
                                 (hp1^.typ <> ait_marker) Then
{so we don't try to check a sequence when p is the first instruction of the block}
                                begin
{$ifdef csdebug}
                                  hp5 := new(pai_asm_comment,init(strpnew(
                                    'cse checking '+att_reg2str[Reg32(Paicpu(p)^.oper[1].reg)])));
                                  insertLLItem(asml,p,p^.next,hp5);
{$endif csdebug}
                                  If CheckSequence(p,prevSeq,Paicpu(p)^.oper[1].reg, Cnt, RegInfo, findPrevSeqs) And
                                     (Cnt > 0) Then
                                    Begin
                                      hp1 := nil;
{ although it's perfectly ok to remove an instruction which doesn't contain }
{ the register that we've just checked (CheckSequence takes care of that),  }
{ the sequence containing this other register should also be completely     }
{ checked and removed, otherwise we may get situations like this:           }
{                                                                           }
{   movl 12(%ebp), %edx                      movl 12(%ebp), %edx            }
{   movl 16(%ebp), %eax                      movl 16(%ebp), %eax            }
{   movl 8(%edx), %edx                       movl 8(%edx), %edx             }
{   movl (%eax), eax                         movl (%eax), eax               }
{   cmpl %eax, %edx                          cmpl %eax, %edx                }
{   jnz  l123           getting converted to jnz  l123                      }
{   movl 12(%ebp), %edx                      movl 4(%eax), eax              }
{   movl 16(%ebp), %eax                                                     }
{   movl 8(%edx), %edx                                                      }
{   movl 4(%eax), eax                                                       }
                                      { mark all Cnt instructions of the matched sequence as }
                                      { removable; p ends up just past the sequence          }
                                      Cnt2 := 1;
                                      While Cnt2 <= Cnt Do
                                        Begin
(*                                          If not(regInInstruction(Paicpu(hp2)^.oper[1].reg, p)) and
                                             not(ppaiprop(p^.optinfo)^.canBeRemoved) then
                                            begin
                                              if (p^.typ = ait_instruction) And
                                                 ((paicpu(p)^.OpCode = A_MOV)  or
                                                  (paicpu(p)^.opcode = A_MOVZX) or
                                                  (paicpu(p)^.opcode = A_MOVSX)) And
                                                 (paicpu(p)^.oper[1].typ = top_reg) then
                                                begin
                                                  regCounter := reg32(paicpu(p)^.oper[1].reg);
                                                  if (regCounter in reginfo.regsStillUsedAfterSeq) then
                                                    begin
                                                      if (hp1 = nil) then
                                                        hp1 := reginfo.lastReload[regCounter];
                                                    end
{$ifndef noremove}
                                                  else
                                                    begin
                                                      hp5 := p;
                                                      for cnt3 := ppaiprop(p^.optinfo)^.regs[regCounter].nrofmods downto 1 do
                                                        begin
                                                          if regModifiedByInstruction(regCounter,hp5) then
                                                            PPaiProp(hp5^.OptInfo)^.CanBeRemoved := True;
                                                          getNextInstruction(hp5,hp5);
                                                        end;
                                                    end
{$endif noremove}
                                                end
                                            end *)
{$ifndef noremove}
                                          { else }
                                          PPaiProp(p^.OptInfo)^.CanBeRemoved := True
{$endif noremove}
                                          ; Inc(Cnt2);
                                          GetNextInstruction(p, p);
                                        End;
   {hp4 is used to get the contents of the registers before the sequence}
                                      GetLastInstruction(hp2, hp4);

                                      getNextInstruction(prevSeq,prevSeq_next);
{$IfDef CSDebug}
                                      For RegCounter := R_EAX To R_EDI Do
                                        If (RegCounter in RegInfo.RegsLoadedForRef) Then
                                          Begin
                                            hp5 := new(pai_asm_comment,init(strpnew('New: '+att_reg2str[RegCounter]+', Old: '+
                                              att_reg2str[RegInfo.New2OldReg[RegCounter]])));
                                            InsertLLItem(AsmL, Pai(hp2^.previous), hp2, hp5);
                                          End;
{$EndIf CSDebug}
 { If some registers were different in the old and the new sequence, move }
 { the contents of those old registers to the new ones                    }
                                      For RegCounter := R_EAX To R_EDI Do
                                        If Not(RegCounter in [R_ESP,procinfo^.framepointer]) And
                                           (RegInfo.New2OldReg[RegCounter] <> R_NO) Then
                                          Begin
                                            AllocRegBetween(AsmL,RegInfo.New2OldReg[RegCounter],
                                              PPaiProp(prevSeq^.OptInfo)^.Regs[RegInfo.New2OldReg[RegCounter]].StartMod,hp2);
                                            { there are instructions between the previous sequence }
                                            { and the removed one                                   }
                                            if hp4 <> prevSeq then
                                              begin
                                                if assigned(reginfo.lastReload[regCounter]) then
                                                  getLastInstruction(reginfo.lastReload[regCounter],hp3)
                                                else if assigned(reginfo.lastReload[regInfo.New2OldReg[regCounter]]) then
                                                  getLastInstruction(reginfo.lastReload[regInfo.new2OldReg[regCounter]],hp3)
                                                else hp3 := hp4;
                                                if prevSeq_next <> hp3 then
                                                  clearRegContentsFrom(regCounter,prevSeq_next,
                                                    hp3);
                                                getnextInstruction(hp3,hp3);
                                                allocRegBetween(asmL,regCounter,prevSeq,hp3);
                                              end;
                                            If Not(RegCounter In RegInfo.RegsLoadedForRef) And
                                                          {old reg                new reg}
                                               (RegInfo.New2OldReg[RegCounter] <> RegCounter) Then
                                              Begin
                                                getLastInstruction(p,hp3);
                                                { first try to rename the new register to the old one in }
                                                { the following code; only if that is not possible, an   }
                                                { explicit "mov oldreg,newreg" is inserted after prevSeq }
                                                If (hp4 <> prevSeq) or
                                                   not(regCounter in usableRegs + [R_EDI,R_ESI]) or
                                                   not ReplaceReg(asmL,RegInfo.New2OldReg[RegCounter],
                                                         regCounter,hp3,
                                                         PPaiProp(PrevSeq^.optInfo)^.Regs[regCounter],true,hp5) then
                                                  begin
                                                    { every item is inserted directly after prevSeq, so the }
                                                    { resulting order is: prevSeq, NoPropInfoStart marker,  }
                                                    { mov, NoPropInfoEnd marker                             }
                                                    hp3 := New(Pai_Marker,Init(NoPropInfoEnd));
                                                    InsertLLItem(AsmL, prevSeq, Pai(prevSeq^.next), hp3);
                                                    hp5 := New(Paicpu,Op_Reg_Reg(A_MOV, S_L,
                                                                         {old reg          new reg}
                                                          RegInfo.New2OldReg[RegCounter], RegCounter));
                                                    { the new instruction gets its own heap allocated copy }
                                                    { of the optimizer info of the instruction after       }
                                                    { prevSeq                                              }
                                                    new(ppaiprop(hp5^.optinfo));
                                                    ppaiprop(hp5^.optinfo)^ := ppaiprop(prevSeq_next^.optinfo)^;
                                                    ppaiprop(hp5^.optinfo)^.canBeRemoved := false;
                                                    InsertLLItem(AsmL, prevSeq, Pai(prevSeq^.next), hp5);
                                                    hp3 := New(Pai_Marker,Init(NoPropInfoStart));
                                                    InsertLLItem(AsmL, prevSeq, Pai(prevSeq^.next), hp3);
                                                    { adjusts states in previous instruction so that it will  }
                                                    { definitely be different from the previous or next state }
                                                    incstate(ppaiprop(hp5^.optinfo)^.
                                                      regs[RegInfo.New2OldReg[RegCounter]].rstate,20);
                                                    incstate(ppaiprop(hp5^.optinfo)^.
                                                      regs[regCounter].wstate,20);
                                                    updateState(RegInfo.New2OldReg[RegCounter],
                                                      hp5);
                                                  end
                                              End
                                            Else
{   imagine the following code:                                            }
{         normal                          wrong optimized                  }
{    movl 8(%ebp), %eax                 movl 8(%ebp), %eax                 }
{    movl (%eax), %eax                  movl (%eax), %eax                  }
{    cmpl 8(%ebp), %eax                 cmpl 8(%ebp), %eax                 }
{    jne l1                             jne l1                             }
{    movl 8(%ebp), %eax                                                    }
{    movl (%eax), %edi                  movl %eax, %edi                    }
{    movl %edi, -4(%ebp)                movl %edi, -4(%ebp)                }
{    movl 8(%ebp), %eax                                                    }
{    pushl 70(%eax)                     pushl 70(%eax)                     }
{                                                                          }
{   The error is that at the moment that the last instruction is executed, }
{   %eax doesn't contain 8(%ebp) anymore. Solution: the contents of        }
{   registers that are completely removed from a sequence (= registers in  }
{   RegLoadedForRef), have to be changed to their contents from before the }
{   sequence.                                                              }
                                              If RegCounter in RegInfo.RegsLoadedForRef Then
                                                Begin
                                                  hp3 := hp2;
                                                  { cnt still holds the number of instructions }
                                                  { of the sequence, so go to the end of it    }
                                                  for cnt2 := 1 to pred(cnt) Do
                                                    getNextInstruction(hp3,hp3);
                                                  { hp4 = instruction prior to start of sequence }
                                                  restoreRegContentsTo(regCounter,
                                                    PPaiProp(hp4^.OptInfo)^.Regs[RegCounter],
                                                    hp2,hp3);
                                                End;
                                          End;
                                      { hp1 was set to nil above and is not changed in between }
                                      If hp1 <> nil Then
                                        p := hp1;
                                      { p already points past the sequence, so skip the }
                                      { GetNextInstruction at the end of the main loop  }
                                      Continue;
                                    End
                                  Else
                                    If (PPaiProp(p^.OptInfo)^.
                                         regs[reg32(paicpu(p)^.oper[1].reg)].typ
                                          in [con_ref,con_noRemoveRef]) and
                                       (PPaiProp(p^.OptInfo)^.CanBeRemoved) Then
                                      if (cnt > 0) then
                                        begin
                                          { un-mark the instructions of the sequence starting at }
                                          { hp2 that use the destination register of hp2         }
                                          p := hp2;
                                          Cnt2 := 1;
                                          While Cnt2 <= Cnt Do
                                            Begin
                                              If RegInInstruction(Paicpu(hp2)^.oper[1].reg, p) Then
                                                PPaiProp(p^.OptInfo)^.CanBeRemoved := False;
                                              Inc(Cnt2);
                                              GetNextInstruction(p, p);
                                            End;
                                          Continue;
                                        End
                                      else
                                        begin
                                          { Fix for web bug 972 }
                                          regCounter := Reg32(Paicpu(p)^.oper[1].reg);
                                          cnt := PPaiProp(p^.optInfo)^.Regs[regCounter].nrOfMods;
                                          { advance hp3 over at most cnt instructions, stopping at the }
                                          { first one that modifies the register and is not removable  }
                                          hp3 := p;
                                          for cnt2 := 1 to cnt do
                                            if not(regModifiedByInstruction(regCounter,hp3) and
                                                   not(PPaiProp(hp3^.optInfo)^.canBeRemoved)) then
                                              getNextInstruction(hp3,hp3)
                                            else
                                              break;
                                          { restore the register contents from before p in [p..hp3] }
                                          getLastInstruction(p,hp4);
                                          RestoreRegContentsTo(regCounter,
                                            PPaiProp(hp4^.optInfo)^.Regs[regCounter],
                                            p,hp3);
                                        end;
                                End;
                            End;
                          { try to replace the new reg with the old reg }
                          if not(PPaiProp(p^.optInfo)^.canBeRemoved) then
                            if (paicpu(p)^.oper[0].typ = top_reg) and
                               (paicpu(p)^.oper[1].typ = top_reg) and
                               { only remove if we're not storing something in a regvar }
                               (paicpu(p)^.oper[1].reg in (usableregs+[R_EDI])) and
                               (paicpu(p)^.opcode = A_MOV) and
                               getLastInstruction(p,hp4) and
                               { we only have to start replacing from the instruction after the mov, }
                               { but replacereg only starts with getnextinstruction(p,p)             }
                               replaceReg(asmL,paicpu(p)^.oper[0].reg,
                                 paicpu(p)^.oper[1].reg,p,
                                 ppaiprop(hp4^.optInfo)^.regs[paicpu(p)^.oper[1].reg],false,hp1) then
                              begin
                                { the register copy itself is no longer needed }
                                ppaiprop(p^.optInfo)^.canBeRemoved := true;
                                allocRegBetween(asmL,paicpu(p)^.oper[0].reg,
                                  ppaiProp(p^.optInfo)^.regs[paicpu(p)^.oper[0].reg].startMod,hp1);
                              end
                            else
                              { note: this else belongs to the inner if, so it is only }
                              { reached when p is not marked as removable              }
                              if (paicpu(p)^.oper[1].typ = top_reg) and
                                 not regInOp(paicpu(p)^.oper[1].reg,paicpu(p)^.oper[0]) then
                                removePrevNotUsedLoad(p,reg32(paicpu(p)^.oper[1].reg),false);
                          { at first, only try optimizations of large blocks, because }
                          { doing smaller ones may prevent bigger ones from           }
                          { completing in the next pass                               }
                          if not doSubOpts and (orgNrOfMods <> 0) then
                            begin
                              p := hp2;
                              for cnt := 1 to pred(orgNrOfMods) do
                                getNextInstruction(p,p);
                            end;
                        End;
                    top_symbol,Top_Const:
                      Begin
                        Case Paicpu(p)^.oper[1].typ Of
                          Top_Reg:
                            Begin
                              regCounter := Reg32(Paicpu(p)^.oper[1].reg);
                              If GetLastInstruction(p, hp1) Then
                                With PPaiProp(hp1^.OptInfo)^.Regs[regCounter] Do
                                  { the register already holds this constant (loaded with }
                                  { at least the same operand size): the load is redundant }
                                  if (typ in [con_const,con_noRemoveConst]) and
                                     (paicpu(startMod)^.opsize >= paicpu(p)^.opsize) and
                                     opsequal(paicpu(StartMod)^.oper[0],paicpu(p)^.oper[0]) Then
                                    begin
                                      PPaiProp(p^.OptInfo)^.CanBeRemoved := True;
                                      allocRegBetween(asmL,regCounter,startMod,p);
                                    end
                                  else
                                    removePrevNotUsedLoad(p,reg32(paicpu(p)^.oper[1].reg),false);

                            End;
                          Top_Ref:
                            { storing a constant to memory: if some register already }
                            { contains that constant, store the register instead     }
                            if (paicpu(p)^.oper[0].typ = top_const) and
                               getLastInstruction(p,hp1) and
                               findRegWithConst(hp1,paicpu(p)^.opsize,paicpu(p)^.oper[0].val,regCounter) then
                              begin
                                paicpu(p)^.loadreg(0,regCounter);
                                allocRegBetween(AsmL,reg32(regCounter),
                                  PPaiProp(hp1^.optinfo)^.regs[regCounter].startMod,p);
                              end;
                        End;
                      End;
                  End;

                End;
              { a std is superfluous if the direction flag state recorded }
              { at the previous instruction is already F_Set              }
              A_STD: If GetLastInstruction(p, hp1) And
                        (PPaiProp(hp1^.OptInfo)^.DirFlag = F_Set) Then
                       PPaiProp(Pai(p)^.OptInfo)^.CanBeRemoved := True;
            End
          End;
      End;
      GetNextInstruction(p, p);
    End;
End;
|
|
|
|
function removeInstructs(asmL: paasmoutput; first, last: pai): boolean;
{ Removes the instructions that were marked as removable and detaches or  }
{ disposes the optimizer info of the remaining ones. Walks the list from  }
{ first up to (not including) last.                                       }
{ Returns true if at least one marked instruction outside a               }
{ noPropInfoStart/noPropInfoEnd region was removed.                       }
{ Items between such markers carry individually allocated optimizer info, }
{ which is disposed here; the info of all other items is part of          }
{ PaiPropBlock, which is released in one go at the end.                   }
Var p, hp1: Pai;
begin
  removeInstructs := false;
  p := First;
  While (p <> Last) Do
    Begin
      If (p^.typ = ait_marker) and
         (pai_marker(p)^.kind = noPropInfoStart) then
        begin
          { drop the start marker itself }
          hp1 := pai(p^.next);
          asmL^.remove(p);
          dispose(p,done);
          { p has just been disposed, so the end marker test has to look }
          { at hp1 (the current item), not at p                          }
          while not((hp1^.typ = ait_marker) and
                    (pai_marker(hp1)^.kind = noPropInfoEnd)) do
            begin
              p := pai(hp1^.next);
{$ifndef noinstremove}
              { allocregbetween can insert new ait_regalloc objects }
              { without optinfo                                     }
              if assigned(hp1^.optinfo) then
                if ppaiprop(hp1^.optinfo)^.canBeRemoved then
                  begin
                    dispose(ppaiprop(hp1^.optinfo));
                    hp1^.optinfo := nil;
                    asmL^.remove(hp1);
                    dispose(hp1,done);
                    hp1 := p;
                  end
                else
{$endif noinstremove}
                  begin
                    dispose(ppaiprop(hp1^.optinfo));
                    hp1^.optinfo := nil;
                  end;
              hp1 := p;
            end;
          { hp1 is now the end marker: continue after it and drop it }
          p := pai(hp1^.next);
          asmL^.remove(hp1);
          dispose(hp1,done);
        end
      else
{$ifndef noinstremove}
        if assigned(p^.optInfo) and
           PPaiProp(p^.optInfo)^.canBeRemoved then
          begin
            hp1 := pai(p^.next);
            AsmL^.Remove(p);
            Dispose(p, Done);
            p := hp1;
            removeInstructs := true;
          End
        Else
{$endif noinstremove}
          Begin
            { only detach the info here, its memory is freed below }
            p^.OptInfo := nil;
            p := pai(p^.next);
          End;
    End;
  FreeMem(PaiPropBlock, NrOfPaiObjs*SizeOf(TPaiProp))
End;
|
|
|
|
function CSE(AsmL: PAasmOutput; First, Last: Pai; pass: longint): boolean;
{ Runs one common subexpression elimination pass over First..Last, followed }
{ by register renaming and the actual removal of the marked instructions.   }
{ The result is the one returned by removeInstructs.                        }
{ Without cs_slowoptimize everything is enabled right away; with it, the    }
{ sub-optimizations and the renaming start at pass 1 and the search for     }
{ previous sequences at pass 2.                                             }
var
  allAtOnce: boolean;
Begin
  allAtOnce := not(cs_slowoptimize in aktglobalswitches);
  DoCSE(AsmL, First, Last, allAtOnce or (pass >= 2), allAtOnce or (pass >= 1));
  { register renaming }
  if allAtOnce or (pass > 0) then
    doRenaming(asmL, first, last);
  cse := removeInstructs(asmL, first, last);
End;
|
|
|
|
End.
|
|
|
|
{
|
|
$Log$
|
|
Revision 1.2 2000-10-24 10:40:53 jonas
|
|
+ register renaming ("fixes" bug1088)
|
|
* changed command line options meanings for optimizer:
|
|
O2 now means peepholopts, CSE and register renaming in 1 pass
|
|
O3 is the same, but repeated until no further optimizations are
|
|
possible or until 5 passes have been done (to avoid endless loops)
|
|
* changed aopt386 so it does this looping
|
|
* added some procedures from csopt386 to the interface because they're
|
|
used by rropt386 as well
|
|
* some changes to csopt386 and daopt386 so that newly added instructions
|
|
by the CSE get optimizer info (they were simply skipped previously),
|
|
this fixes some bugs
|
|
|
|
Revision 1.1 2000/10/15 09:47:43 peter
|
|
* moved to i386/
|
|
|
|
Revision 1.14 2000/09/30 13:07:23 jonas
|
|
* fixed support for -Or with new features of CSE
|
|
|
|
Revision 1.13 2000/09/29 23:14:45 jonas
|
|
* search much further back for CSE sequences (non-conflicting stores are
|
|
now passed)
|
|
* remove more unnecessary loads of registers (especially the self pointer)
|
|
|
|
Revision 1.12 2000/09/26 11:49:41 jonas
|
|
* writes to register variables and to the self pointer now also count as
|
|
      memory writes
|
|
|
|
Revision 1.11 2000/09/25 09:50:29 jonas
|
|
- removed TP conditional code
|
|
|
|
Revision 1.10 2000/09/24 15:06:14 peter
|
|
* use defines.inc
|
|
|
|
Revision 1.9 2000/09/22 15:01:59 jonas
|
|
* fixed some bugs in the previous improvements: in some cases, esi was
|
|
still being replaced before a conditional jump (the code that
|
|
detected conditional jumps sometimes skipped over them)
|
|
|
|
Revision 1.8 2000/09/20 15:00:58 jonas
|
|
+ much improved CSE: the CSE now searches further back for sequences it
|
|
can reuse. After I've also implemented register renaming, the effect
|
|
should be even better (afaik web bug 1088 will then even be optimized
|
|
properly). I don't know about the slow down factor this adds. Maybe
|
|
a new optimization level should be introduced?
|
|
|
|
Revision 1.7 2000/08/25 19:40:45 jonas
|
|
* refined previous fix a bit, some instructions weren't being removed
|
|
while they could (merged from fixes branch)
|
|
* made checksequence a bit faster
|
|
|
|
Revision 1.6 2000/08/23 12:55:10 jonas
|
|
* fix for web bug 1112 and a bit of clean up in csopt386 (merged from
|
|
fixes branch)
|
|
|
|
Revision 1.5 2000/08/04 20:08:03 jonas
|
|
* improved detection of range of instructions which use a register
|
|
(merged from fixes branch)
|
|
|
|
Revision 1.4 2000/07/21 15:19:54 jonas
|
|
* daopt386: changes to getnextinstruction/getlastinstruction so they
|
|
ignore labels who have is_addr set
|
|
+ daopt386/csopt386: remove loads of registers which are overwritten
|
|
      before their contents are used (especially useful for removing superfluous
|
|
maybe_loadesi outputs and push/pops transformed by below optimization
|
|
+ popt386: transform pop/pop/pop/.../push/push/push to sequences of
|
|
'movl x(%esp),%reg' (only active when compiling a go32v2 compiler
|
|
currently because I don't know whether it's safe to do this under Win32/
|
|
Linux (because of problems we had when using esp as frame pointer on
|
|
those os'es)
|
|
|
|
Revision 1.3 2000/07/14 05:11:48 michael
|
|
+ Patch to 1.1
|
|
|
|
Revision 1.2 2000/07/13 11:32:39 michael
|
|
+ removed logs
|
|
|
|
}
|