{ $Id$ Copyright (c) 1997-98 by Jonas Maebe This unit contains the data flow analyzer and several helper procedures and functions. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. **************************************************************************** } Unit DAOpt386; Interface Uses AAsm, CObjects {$ifdef i386} ,i386 {$endif} ; {*********************** Procedures and Functions ************************} Procedure InsertLLItem(AsmL: PAasmOutput; prev, foll, new_one: PLinkedList_Item); Function Reg32(Reg: TRegister): TRegister; Function RefsEqual(Const R1, R2: TReference): Boolean; Function IsGP32Reg(Reg: TRegister): Boolean; Function RegInRef(Reg: TRegister; Const Ref: TReference): Boolean; Function RegInInstruction(Reg: TRegister; p1: Pai): Boolean; Function PowerOf2(L: Longint): Longint; Function GetNextInstruction(Current: Pai; Var Next: Pai): Boolean; Function GetLastInstruction(Current: Pai; Var Last: Pai): Boolean; Function RegsSameContent(p1, p2: Pai; Reg: TRegister): Boolean; Function InstructionsEqual(p1, p2: Pai): Boolean; Procedure DFAPass1(AsmL: PAasmOutput); Function DFAPass2(AsmL: PAasmOutput): Pai; Function FindLabel(L: PLabel; Var hp: Pai): Boolean; {Procedure FindLoHiLabels(AsmL: PAasmOutput; Var LoLab, HiLab, LabDif: Longint);} {******************************* Constants *******************************} Const {ait_* types which don't result in executable code or which don't influence the way the program runs/behaves} SkipInstr = [ait_comment {$ifdef GDB} ,ait_stabs, ait_stabn, ait_stab_function_name {$endif GDB} {$ifdef regalloc} ,ait_regalloc, ait_regdealloc {$endif regalloc} ]; {the maximum number of things (registers, memory, ...) a single instruction changes} MaxCh = 3; {Possible register content types} con_Unknown = 0; con_ref = 1; con_const = 2; {********************************* Types *********************************} Type {What an instruction can change} TChange = (C_None, C_EAX, C_ECX, C_EDX, C_EBX, C_ESP, C_EBP, C_ESI, C_EDI, C_CDirFlag {clear direction flag}, C_SDirFlag {set dir flag}, C_Flags, C_FPU, C_Op1, C_Op2, C_Op3, C_MemEDI); {the possible states of a flag} TFlagContents = (F_Unknown, F_NotSet, F_Set); {the properties of a cpu instruction} TAsmInstrucProp = Record {how many things it changes} NCh: Byte; {and what it changes} Ch: Array[1..MaxCh] of TChange; End; TContent = Record {start and end of block instructions that defines the content of this register. If Typ = con_const, then Longint(StartMod) = value of the constant)} StartMod: Pointer; {starts at 0, gets increased everytime the register is modified} State: Word; {how many instructions starting with StarMod does the block consist of} NrOfMods: Byte; {if one register gets a block assigned from an other register, this variable holds the name of that register (so it can be substituted when checking the block afterwards)} { ModReg: TRegister; } {the tpye of the content of the register: constant, ...} Typ: Byte; End; {Contents of the integer registers} TRegContent = Array[R_NO..R_EDI] Of TContent; {contents of the FPU registers} TRegFPUContent = Array[R_ST..R_ST7] Of TContent; {information record with the contents of every register. Every Pai object gets one of these assigned: a pointer to it is stored in the Line field and the original line number is stored in LineSave} TPaiProp = Record Regs: TRegContent; { FPURegs: TRegFPUContent;} {currently not yet used} LineSave: Longint; {status of the direction flag} DirFlag: TFlagContents; {can this instruction be removed?} CanBeRemoved: Boolean; End; PPaiProp = ^TPaiProp; {$IfDef TP} TPaiPropBlock = Array[1..(65520 div (((SizeOf(TPaiProp)+1)div 2)*2))] Of TPaiProp; {$else} TPaiPropBlock = Array[1..250000] Of TPaiProp; {$EndIf TP} PPaiPropBlock = ^TPaiPropBlock; {$IfDef JmpAnal} TLabelTableItem = Record p: Pai; {$IfDef TP} RefsFound: Byte; {$Else TP} RefsFound: Word; {$EndIf TP} AlreadyProcessed: Boolean; End; {$Else JmpAnal} TLabelTableItem = Pai; {$Endif JmpAnal} {$IfDef tp} TLabelTable = Array[0..9000] Of TLabelTableItem; {$Else tp} TLabelTable = Array[0..2500000] Of TLabelTableItem; {$Endif tp} PLabelTable = ^TLabelTable; TwoWords = Record Word1, Word2: Word; End; {******************************* Variables *******************************} Var {the amount of PaiObjects in the current assembler list} NrOfPaiObjs, {for TP only: the amount of PPaiProps that can be stored in the PaiPropBlock} NrOfPaiFast: Longint; {Array which holds all (FPC) or as much as possible (TP) PPaiProps} PaiPropBlock: PPaiPropBlock; LoLab, HiLab, LabDif: Longint; LTable: PLabelTable; {*********************** End of Interface section ************************} Implementation Uses globals, systems, strings, verbose, hcodegen, {$ifdef i386} cgi386; {$endif i386} Const AsmInstr: Array[tasmop] Of TAsmInstrucProp = ( {MOV} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVZX} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVSX} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {LABEL} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {ADD} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {CALL} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {IDIV} (NCh: 3; Ch: (C_EAX, C_EDX, C_Flags)), {IMUL} (NCh: 3; Ch: (C_EAX, C_EDX, C_Flags)), {handled separately, because several forms exist} {JMP} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {LEA} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MUL} (NCh: 3; Ch: (C_EAX, C_EDX, C_Flags)), {NEG} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {NOT} (NCh: 2; Ch: (C_Op1, C_Flags, C_None)), {POP} (NCh: 2; Ch: (C_Op1, C_ESP, C_None)), {POPAD} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {PUSH} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {PUSHAD} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {RET} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {SUB} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {XCHG} (NCh: 2; Ch: (C_Op1, C_Op2, C_None)), {(will be) handled seperately} {XOR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {FILD} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {CMP} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {JZ} (NCh: 0; Ch: (C_None, C_None, C_None)), {INC} (NCh: 2; Ch: (C_Op1, C_Flags, C_None)), {DEC} (NCh: 2; Ch: (C_Op1, C_Flags, C_None)), {SETE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETG} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETLE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETGE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {JE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JL} (NCh: 0; Ch: (C_None, C_None, C_None)), {JG} (NCh: 0; Ch: (C_None, C_None, C_None)), {JLE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JGE} (NCh: 0; Ch: (C_None, C_None, C_None)), {OR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {FLD} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FADD} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FMUL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUB} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIV} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCHS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLD1} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIV} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {CLTD} (NCh: 1; Ch: (C_EDX, C_None, C_None)), {JNZ} (NCh: 0; Ch: (C_None, C_None, C_None)), {FSTP} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {AND} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {JNO} (NCh: 0; Ch: (C_None, C_None, C_None)), {NOTH} (NCh: 0; Ch: (C_None, C_None, C_None)), {***???***} {NONE} (NCh: 0; Ch: (C_None, C_None, C_None)), {ENTER} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {LEAVE} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {CLD} (NCh: 1; Ch: (C_CDirFlag, C_None, C_None)), {MOVS} (NCh: 3; Ch: (C_ESI, C_EDI, C_MemEDI)), {REP} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {SHL} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {SHR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {BOUND} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNS} (NCh: 0; Ch: (C_None, C_None, C_None)), {JS} (NCh: 0; Ch: (C_None, C_None, C_None)), {JO} (NCh: 0; Ch: (C_None, C_None, C_None)), {SAR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {TEST} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {FCOM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOMP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOMPP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FXCH} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FADDP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FMULP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIVP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNSTS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SAHF} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {FDIVRP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBRP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {SETC} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNC} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {JC} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNC} (NCh: 0; Ch: (C_None, C_None, C_None)), {JA} (NCh: 0; Ch: (C_None, C_None, C_None)), {JAE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JB} (NCh: 0; Ch: (C_None, C_None, C_None)), {JBE} (NCh: 0; Ch: (C_None, C_None, C_None)), {SETA} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETAE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETB} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETBE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {AAA} (NCh: 2; Ch: (C_EAX, C_Flags, C_None)), {AAD} (NCh: 2; Ch: (C_EAX, C_Flags, C_None)), {AAM} (NCh: 2; Ch: (C_EAX, C_Flags, C_None)), {AAS} (NCh: 2; Ch: (C_EAX, C_Flags, C_None)), {CBW} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {CDQ} (NCh: 2; Ch: (C_EAX, C_EDX, C_None)), {CLC} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {CLI} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {CLTS} (NCh: 0; Ch: (C_None, C_None, C_None)), {CMC} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {CWD} (NCh: 2; Ch: (C_EAX, C_EDX, C_None)), {CWDE} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {DAA} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {DAS} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {HLT} (NCh: 0; Ch: (C_None, C_None, C_None)), {IRET} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {LAHF} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {LODS} (NCh: 2; Ch: (C_EAX, C_ESI, C_None)), {LOCK} (NCh: 0; Ch: (C_None, C_None, C_None)), {NOP} (NCh: 0; Ch: (C_None, C_None, C_None)), {PUSHA} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {PUSHF} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {PUSHFD} (NCh: 1; Ch: (C_ESP, C_None, C_None)), {STC} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {STD} (NCh: 1; Ch: (C_SDirFlag, C_None, C_None)), {STI} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {STOS} (NCh: 2; Ch: (C_MemEDI, C_EDI, C_None)), {WAIT} (NCh: 0; Ch: (C_None, C_None, C_None)), {XLAT} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {XLATB} (NCh: 1; Ch: (C_EAX, C_None, C_None)), {MOVSB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVSBL} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVSBW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVSWL} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVZB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {MOVZWL} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {POPA} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {IN} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {OUT} (NCh: 0; Ch: (C_None, C_None, C_None)), {LDS} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {LCS} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {LES} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {LFS} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {LGS} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {LSS} (NCh: 2; Ch: (C_Op2, C_None, C_None)), {POPF} (NCh: 2; Ch: (C_Flags, C_ESP, C_None)), {SBB} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {ADC} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {DIV} (NCh: 3; Ch: (C_EAX, C_EDX, C_Flags)), {ROR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {ROL} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {RCL} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {RCR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {SAL} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {SHLD} (NCh: 2; Ch: (C_Op3, C_Flags, C_None)), {SHRD} (NCh: 2; Ch: (C_Op3, C_Flags, C_None)), {LCALL} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {LJMP} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {LRET} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {JNAE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNB} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNA} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNBE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JP} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNP} (NCh: 0; Ch: (C_None, C_None, C_None)), {JPE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JPO} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNGE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNG} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNL} (NCh: 0; Ch: (C_None, C_None, C_None)), {JNLE} (NCh: 0; Ch: (C_None, C_None, C_None)), {JCXZ} (NCh: 0; Ch: (C_None, C_None, C_None)), {JECXZ} (NCh: 0; Ch: (C_None, C_None, C_None)), {LOOP} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {CMPS} (NCh: 3; Ch: (C_ESI, C_EDI, C_Flags)), {INS} (NCh: 1; Ch: (C_EDI, C_None, C_None)), {OUTS} (NCh: 1; Ch: (C_ESI, C_None, C_None)), {SCAS} (NCh: 2; Ch: (C_EDI, C_Flags, C_None)), {BSF} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {BSR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {BT} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {BTC} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {BTR} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {BTS} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {INT} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {INT3} (NCh: 0; Ch: (C_None, C_None, C_None)), {INTO} (NCh: 255; Ch: (C_None, C_None, C_None)), {don't know value of any register} {BOUNDL} (NCh: 0; Ch: (C_None, C_None, C_None)), {BOUNDW} (NCh: 0; Ch: (C_None, C_None, C_None)), {LOOPZ} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {LOOPE} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {LOOPNZ} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {LOOPNE} (NCh: 1; Ch: (C_ECX, C_None, C_None)), {SETO} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNO} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNAE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNB} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETZ} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNZ} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNA} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNBE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETP} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETPE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNP} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETPO} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNGE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNG} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SETNLE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {ARPL} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {LAR} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {LGDT} (NCh: 0; Ch: (C_None, C_None, C_None)), {LIDT} (NCh: 0; Ch: (C_None, C_None, C_None)), {LLDT} (NCh: 0; Ch: (C_None, C_None, C_None)), {LMSW} (NCh: 0; Ch: (C_None, C_None, C_None)), {LSL} (NCh: 2; Ch: (C_Op2, C_Flags, C_None)), {LTR} (NCh: 0; Ch: (C_None, C_None, C_None)), {SGDT} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SIDT} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SLDT} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {SMSW} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {STR} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {VERR} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {VERW} (NCh: 1; Ch: (C_Flags, C_None, C_None)), {FABS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FBLD} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FBSTP} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FCLEX} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNCLEX} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDECSTP}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDISI} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNDISI} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIVR} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FENI} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNENI} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FFREE} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIADD} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOMP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVR} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIMUL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FINCSTP}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FINIT} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNINIT} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIST} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTP} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISUB} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBR} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDCW} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDENV} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDLG2} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDLN2} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDL2E} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDL2T} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDPI} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDZ} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FNOP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FPATAN} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FPREM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FPREM1} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FPTAN} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FRNDINT}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FRSTOR} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSAVE} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FNSAVE} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSCALE} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSETPM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSIN} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSINCOS}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSQRT} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FST} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTCW} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FNSTCW} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTENV} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FNSTENV}(NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTSW} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FNSTSW} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FTST} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FUCOM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FUCOMP} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FUCOMPP}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FWAIT} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FXAM} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FXTRACT}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FYL2X} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FYL2XP1}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {F2XM1} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FILDQ} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FILDS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FILDL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FLDT} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FISTQ} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTPS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTPL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTPL} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTPS} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FISTPQ} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FSTPT} (NCh: 1; Ch: (C_Op1, C_None, C_None)), {FCOMPS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOMPL}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOMPL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOMPS}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOMS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOML} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FCOML} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FICOMS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIADDL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FADDL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIADDS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FISUBL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FISUBS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBR} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBRS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FISUBRL}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FSUBRL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FISUBRS}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FMULS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIMUL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FMULL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIMULS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIVL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIVRS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVRL}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {FDIVRL} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {FIDIVRS}(NCh: 1; Ch: (C_FPU, C_None, C_None)), {REPE} (NCh: 0; Ch: (C_ECX, C_None, C_None)), {REPNE} (NCh: 0; Ch: (C_ECX, C_None, C_None)), {FADDS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {POPFD} (NCh: 2; Ch: (C_ESP, C_Flags, C_None)), {below are the MMX instructions} {A_EMMS} (NCh: 1; Ch: (C_FPU, C_None, C_None)), {A_MOVD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_MOVQ} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PACKSSDW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PACKSSWB} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PACKUSWB} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PADDB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDSB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDSW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDUSB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDUSW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PADDW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PAND} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PANDN} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PCMPEQB} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PCMPEQD} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PCMPEQW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PCMPGTB} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PCMPGTD} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PCMPGTW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PMADDWD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PMULHW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PMULLW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_POR} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSLLD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSLLQ} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSLLW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSRAD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSRAW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSRLD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSRLQ} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSRLW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBD} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBSB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBSW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBUSB} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBUSW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PSUBW} (NCh: 1; Ch: (C_Op2, C_None, C_None)), {A_PUNPCKHBW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PUNPCKHDQ} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PUNPCKHWD} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PUNPCKLBW} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PUNPCKLDQ} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PUNPCKLWD} (NCh: 255; Ch: (C_FPU, C_None, C_None)), {A_PXOR} (NCh: 1; Ch: (C_Op2, C_None, C_None))); Var {How many instructions are betwen the current instruction and the last one that modified the register} NrOfInstrSinceLastMod: Array[R_EAX..R_EDI] Of Byte; {************************ Create the Label table ************************} Procedure FindLoHiLabels(AsmL: PAasmOutput; Var LoLab, HiLab, LabDif: Longint); {Walks through the paasmlist to find the lowest and highest label number; Since 0.9.3: also removes unused labels} Var LabelFound: Boolean; P, hp1: Pai; Begin LabelFound := False; LoLab := MaxLongint; HiLab := 0; P := Pai(AsmL^.first); While Assigned(p) Do Begin If (Pai(p)^.typ = ait_label) Then If (Pai_Label(p)^.l^.is_used) Then Begin LabelFound := True; If (Pai_Label(p)^.l^.nb < LoLab) Then LoLab := Pai_Label(p)^.l^.nb; If (Pai_Label(p)^.l^.nb > HiLab) Then HiLab := Pai_Label(p)^.l^.nb; End Else Begin hp1 := pai(p^.next); AsmL^.Remove(p); Dispose(p, Done); p := hp1; continue; End; p := pai(p^.next); End; If LabelFound Then LabDif := HiLab+1-LoLab Else LabDif := 0; End; Procedure BuildLabelTable(AsmL: PAasmOutput; Var LabelTable: PLabelTable; LowLabel: Longint; Var LabelDif: Longint); {Builds a table with the locations of the labels in the paasmoutput} Var p: Pai; Begin If (LabelDif <> 0) Then Begin {$IfDef TP} If (MaxAvail >= LabelDif*SizeOf(Pai)) Then Begin {$EndIf TP} GetMem(LabelTable, LabelDif*SizeOf(TLabelTableItem)); FillChar(LabelTable^, LabelDif*SizeOf(TLabelTableItem), 0); p := pai(AsmL^.first); While Assigned(p) Do Begin If (Pai(p)^.typ = ait_label) Then {$IfDef JmpAnal} LabelTable^[Pai_Label(p)^.l^.nb-LowLabel].p := p; {$Else JmpAnal} LabelTable^[Pai_Label(p)^.l^.nb-LowLabel] := p; {$EndIf JmpAnal} p := pai(p^.next); End; {$IfDef TP} End Else LabelDif := 0; {$EndIf TP} End; End; {************************ Search the Label table ************************} Function FindLabel(L: PLabel; Var hp: Pai): Boolean; {searches for the specified label starting from hp as long as the encountered instructions are labels, to be able to optimize constructs like jne l2 jmp l2 jmp l3 and l1: l1: l2: l2:} Var TempP: Pai; Begin TempP := hp; While Assigned(TempP) and (pai(TempP)^.typ In SkipInstr + [ait_label]) Do If (pai_label(TempP)^.l <> L) Then TempP := Pai(TempP^.next) Else Begin hp := TempP; FindLabel := True; exit End; FindLabel := False End; {************************ Some general functions ************************} Function Reg32(Reg: TRegister): TRegister; {Returns the 32 bit component of Reg if it exists, otherwise Reg is returned} Begin Reg32 := Reg; If (Reg >= R_AX) Then If (Reg <= R_DI) Then Reg32 := Reg16ToReg32(Reg) Else If (Reg <= R_BL) Then Reg32 := Reg8toReg32(Reg); End; Function PowerOf2(L: Longint): Longint; Var Counter, TempVal: Longint; Begin TempVal := 1; For Counter := 1 to L Do TempVal := TempVal * 2; PowerOf2 := TempVal; End; { inserts new_one between prev and foll } Procedure InsertLLItem(AsmL: PAasmOutput; prev, foll, new_one: PLinkedList_Item); Begin If Assigned(prev) Then If Assigned(foll) Then Begin If Assigned(new_one) Then Begin new_one^.previous := prev; new_one^.next := foll; prev^.next := new_one; foll^.previous := new_one; End; End Else AsmL^.Concat(new_one) Else If Assigned(Foll) Then AsmL^.Insert(new_one) End; {********************* Compare parts of Pai objects *********************} Function RefsEqual(Const R1, R2: TReference): Boolean; Begin If R1.IsIntValue Then RefsEqual := R2.IsIntValue and (R1.Offset = R2.Offset) Else If (R1.Offset = R2.Offset) And (R1.Base = R2.Base) And (R1.Index = R2.Index) And (R1.Segment = R2.Segment) And (R1.ScaleFactor = R2.ScaleFactor) Then Begin If Assigned(R1.Symbol) Then RefsEqual := Assigned(R2.Symbol) And (R1.Symbol^=R2.Symbol^) Else RefsEqual := Not(Assigned(R2.Symbol)); End Else RefsEqual := False; End; Function IsGP32Reg(Reg: TRegister): Boolean; {Checks if the register is a 32 bit general purpose register} Begin If (Reg >= R_EAX) and (Reg <= R_EBX) Then IsGP32Reg := True Else IsGP32reg := False End; Function RegInRef(Reg: TRegister; Const Ref: TReference): Boolean; Begin {checks whether Ref contains a reference to Reg} Reg := Reg32(Reg); RegInRef := (Ref.Base = Reg) Or (Ref.Index = Reg) End; Function RegInInstruction(Reg: TRegister; p1: Pai): Boolean; {checks if Reg is used by the instruction p1} Var TmpResult: Boolean; Begin TmpResult := False; If (Pai(p1)^.typ = ait_instruction) Then Begin Case Pai386(p1)^.op1t Of Top_Reg: TmpResult := Reg = TRegister(Pai386(p1)^.op1); Top_Ref: TmpResult := RegInRef(Reg, TReference(Pai386(p1)^.op1^)) End; If Not(TmpResult) Then Case Pai386(p1)^.op2t Of Top_Reg: if Pai386(p1)^.op3t<>Top_reg then TmpResult := Reg = TRegister(Pai386(p1)^.op2) else TmpResult := longint(Reg) = twowords(Pai386(p1)^.op2).word1; Top_Ref: TmpResult := RegInRef(Reg, TReference(Pai386(p1)^.op2^)) End; If Not(TmpResult) Then Case Pai386(p1)^.op3t Of Top_Reg: TmpResult := longint(Reg) =twowords(Pai386(p1)^.op2).word2; Top_none:; else internalerror($Da); End End; RegInInstruction := TmpResult End; {********************* GetNext and GetLastInstruction *********************} Function GetNextInstruction(Current: Pai; Var Next: Pai): Boolean; {skips ait_regalloc, ait_regdealloc and ait_stab* objects and puts the next pai object in Next. Returns false if there isn't any} Begin GetNextInstruction := False; Current := Pai(Current^.Next); While Assigned(Current) And (Pai(Current)^.typ In SkipInstr) Do Current := Pai(Current^.Next); If Assigned(Current) Then Begin Next := Current; GetNextInstruction := True; End; End; Function GetLastInstruction(Current: Pai; Var Last: Pai): Boolean; {skips the ait-types in SkipInstr puts the previous pai object in Last. Returns false if there isn't any} Begin GetLastInstruction := False; Current := Pai(Current^.previous); While Assigned(Current) And (Pai(Current)^.typ In SkipInstr) Do Current := Pai(Current^.previous); If Assigned(Current) Then Begin Last := Current; GetLastInstruction := True; End; End; {******************* The Data Flow Analyzer functions ********************} (*Function FindZeroreg(p: Pai; Var Result: TRegister): Boolean; {Finds a register which contains the constant zero} Var Counter: TRegister; Begin Counter := R_EAX; FindZeroReg := True; While (Counter <= R_EDI) And ((PPaiProp(p^.fileinfo.line)^.Regs[Counter].Typ <> Con_Const) or (PPaiProp(p^.fileinfo.line)^.Regs[Counter].StartMod <> Pointer(0))) Do Inc(Byte(Counter)); If (PPaiProp(p^.fileinfo.line)^.Regs[Counter].Typ = Con_Const) And (PPaiProp(p^.fileinfo.line)^.Regs[Counter].StartMod = Pointer(0)) Then Result := Counter Else FindZeroReg := False; End;*) Function TCh2Reg(Ch: TChange): TRegister; {converts a TChange variable to a TRegister} Begin If (CH <= C_EDI) Then TCh2Reg := TRegister(Byte(Ch)) Else InternalError($db) End; Procedure DestroyReg(p1: pai; Reg: TRegister); {Destroys the contents of the register Reg in the PPaiProp of P} Var TmpState: Longint; Begin Reg := Reg32(Reg); NrOfInstrSinceLastMod[Reg] := 0; If (Reg >= R_EAX) And (Reg <= R_EDI) Then Begin TmpState := PPaiProp(p1^.fileinfo.line)^.Regs[Reg].State+1; FillChar(PPaiProp(p1^.fileinfo.line)^.Regs[Reg], SizeOf(TContent), 0); PPaiProp(p1^.fileinfo.line)^.Regs[Reg].State := TmpState; End; End; Function OpsEqual(typ: Longint; op1, op2: Pointer): Boolean; Begin {checks whether the two ops are equal} Case typ Of Top_Reg, Top_Const: OpsEqual := op1 = op2; Top_Ref: OpsEqual := RefsEqual(TReference(op1^), TReference(op2^)); Top_None: OpsEqual := True Else OpsEqual := False End; End; Function RegsSameContent(p1, p2: Pai; Reg: TRegister): Boolean; {checks whether Reg has the same content in the PPaiProp of p1 and p2} Begin Reg := Reg32(Reg); RegsSameContent := PPaiProp(p1^.fileinfo.line)^.Regs[Reg].State = PPaiProp(p2^.fileinfo.line)^.Regs[Reg].State; End; Function InstructionsEqual(p1, p2: Pai): Boolean; Begin {checks whether two Pai386 instructions are equal} InstructionsEqual := Assigned(p1) And Assigned(p2) And {$ifdef regalloc} ((((Pai(p1)^.typ = ait_regalloc) And (Pai(p2)^.typ = ait_regalloc)) Or ((Pai(p1)^.typ = ait_regdealloc) And (Pai(p2)^.typ = ait_regdealloc))) And (PaiRegAlloc(p1)^.reg = PaiRegAlloc(p2)^.reg)) Or {$endif regalloc} ((Pai(p1)^.typ = ait_instruction) And (Pai(p1)^.typ = ait_instruction) And (Pai386(p1)^._operator = Pai386(p2)^._operator) And (Pai386(p1)^.op1t = Pai386(p2)^.op1t) And (Pai386(p1)^.op2t = Pai386(p2)^.op2t) And OpsEqual(Pai386(p1)^.op1t, Pai386(p1)^.op1, Pai386(p2)^.op1) And OpsEqual(Pai386(p1)^.op2t, Pai386(p1)^.op2, Pai386(p2)^.op2)) End; Procedure DestroyRefs(p: pai; Const Ref: TReference; WhichRegNot: TRegister); {destroys all registers which possibly contain a reference to Ref} Var Counter: TRegister; Begin WhichRegNot := Reg32(WhichRegNot); If (Ref.base <> R_NO) Or (Ref.index <> R_NO) Then Begin If (Ref.base = ProcInfo.FramePointer) Then {write something to a parameter or a local variable} For Counter := R_EAX to R_EDI Do With PPaiProp(p^.fileinfo.line)^.Regs[Counter] Do Begin If (Counter <> WhichRegNot) And (typ = Con_Ref) And (Pai(StartMod)^.typ = ait_instruction) And (Pai386(StartMod)^.op1t = top_ref) And (RefsEqual(TReference(Pai386(StartMod)^.op1^), Ref) Or (Not(cs_UncertainOpts in AktSwitches) And (NrOfMods <> 1))) Then DestroyReg(p, Counter) End Else {writing something to a pointer location} For Counter := R_EAX to R_EDI Do With PPaiProp(p^.fileinfo.line)^.Regs[Counter] Do If (Counter <> WhichRegNot) And (typ = Con_Ref) And (Not(cs_UncertainOpts in AktSwitches) Or (Ref.Base = R_EDI) Or (Not((NrOfMods = 1) And (Pai(StartMod)^.typ = ait_instruction) And (Pai386(StartMod)^.op1t = top_ref) And (PReference(Pai386(StartMod)^.op1)^.base = ProcInfo.FramePointer)))) Then DestroyReg(p, Counter) {we don't know what memory location the reference points to, so we just destroy every register which contains a memory reference} End Else {the ref is a var name or we just have a reference an absolute offset} Begin For Counter := R_EAX to R_EDI Do If (Counter <> WhichRegNot) And (PPaiProp(p^.fileinfo.line)^.Regs[Counter].typ = Con_Ref) And (Not(cs_UncertainOpts in AktSwitches) Or RefsEqual(Ref, TReference(Pai386(PPaiProp(p^.fileinfo.line)^.Regs[Counter].StartMod)^.op1^))) Then DestroyReg(p, Counter) End; End; Procedure DestroyAllRegs(p: Pai); Var Counter: TRegister; Begin {initializes/desrtoys all registers} For Counter := R_EAX To R_EDI Do DestroyReg(p, Counter); PPaiProp(p^.fileinfo.line)^.DirFlag := F_Unknown; End; Procedure Destroy(PaiObj: Pai; opt: Longint; Op: Pointer); Begin Case opt Of top_reg: DestroyReg(PaiObj, TRegister(Op)); top_ref: DestroyRefs(PaiObj, TReference(Op^), R_NO); top_symbol:; End; End; Procedure DFAPass1(AsmL: PAasmOutput); {gathers the RegAlloc data... still need to think about where to store it} Begin FindLoHiLabels(AsmL, LoLab, HiLab, LabDif); BuildLabelTable(AsmL, LTable, LoLab, LabDif); End; Function DoDFAPass2(First: Pai): Pai; {Analyzes the Data Flow of an assembler list. Starts creating the reg contents for the instructions starting with p. Returns the last pai which has been processed} Var TmpProp: PPaiProp; Cnt, InstrCnt: Longint; InstrProp: TAsmInstrucProp; p: Pai; TmpRef: TReference; TmpReg: TRegister; Begin p := First; InstrCnt := 1; FillChar(NrOfInstrSinceLastMod, SizeOf(NrOfInstrSinceLastMod), 0); While Assigned(p) Do Begin DoDFAPass2 := p; If (InstrCnt <= NrOfPaiFast) Then TmpProp := @PaiPropBlock^[InstrCnt] Else New(TmpProp); If (p <> First) Then TmpProp^ := PPaiProp(Pai(p^.previous)^.fileinfo.line)^ Else FillChar(TmpProp^, SizeOf(TmpProp^), 0); TmpProp^.linesave := p^.fileinfo.line; PPaiProp(p^.fileinfo.line) := TmpProp; For TmpReg := R_EAX To R_EDI Do Inc(NrOfInstrSinceLastMod[TmpReg]); Case p^.typ Of ait_label: DestroyAllRegs(p); ait_labeled_instruction {$ifdef GDB} , ait_stabs, ait_stabn, ait_stab_function_name {$endif GDB} :; {nothing changes} {$ifdef regalloc} ait_regalloc, ait_regdealloc:; {$endif regalloc} ait_instruction: Begin InstrProp := AsmInstr[Pai386(p)^._operator]; Case Pai386(p)^._operator Of A_MOV, A_MOVZX, A_MOVSX: Begin Case Pai386(p)^.op1t Of Top_Reg: Case Pai386(p)^.op2t Of Top_Reg: Begin DestroyReg(p, TRegister(Pai386(p)^.op2)); { TmpProp^.Regs[TRegister(Pai386(p)^.op2)] := TmpProp^.Regs[TRegister(Pai386(p)^.op1)]; If (TmpProp^.Regs[TRegister(Pai386(p)^.op2)].ModReg = R_NO) Then TmpProp^.Regs[TRegister(Pai386(p)^.op2)].ModReg := Tregister(Pai386(p)^.op1);} End; Top_Ref: DestroyRefs(p, TReference(Pai386(p)^.op2^), TRegister(Pai386(p)^.op1)); End; Top_Ref: Begin {destination is always a register in this case} TmpReg := Reg32(TRegister(Pai386(p)^.op2)); If (RegInRef(TmpReg, TReference(Pai386(p)^.op1^))) Then Begin With PPaiProp(Pai(p)^.fileinfo.line)^.Regs[TmpReg] Do Begin Inc(State); If (typ <> Con_Ref) Then Begin typ := Con_Ref; StartMod := p; End; {also store how many instructions are part of the sequence in the first instructions PPaiProp, so it can be easily accessed from within CheckSequence} Inc(NrOfMods, NrOfInstrSinceLastMod[TmpReg]); PPaiProp(Pai(StartMod)^.fileinfo.line)^.Regs[TmpReg].NrOfMods := NrOfMods; NrOfInstrSinceLastMod[TmpReg] := 0; End; End Else Begin DestroyReg(p, TmpReg); With PPaiProp(Pai(p)^.fileinfo.line)^.Regs[TmpReg] Do Begin Typ := Con_Ref; StartMod := p; NrOfMods := 1; End; End; End; Top_Const: Begin Case Pai386(p)^.op2t Of Top_Reg: Begin TmpReg := Reg32(TRegister(Pai386(p)^.op2)); With TmpProp^.Regs[TmpReg] Do Begin {it doesn't matter that the state is changed, it isn't looked at when removing constant reloads} DestroyReg(p, TmpReg); typ := Con_Const; StartMod := Pai386(p)^.op1; End End; Top_Ref: DestroyRefs(P, TReference(Pai386(p)^.op2^), R_NO); End; End; End; End; A_IMUL: Begin If (Pai386(p)^.Op3t = top_none) Then If (Pai386(p)^.Op2t = top_none) Then Begin DestroyReg(p, R_EAX); DestroyReg(p, R_EDX) End Else Begin If (Pai386(p)^.Op2t = top_reg) Then DestroyReg(p, TRegister(Pai386(p)^.Op2)); End Else If (Pai386(p)^.Op3t = top_reg) Then DestroyReg(p, TRegister(longint(twowords(Pai386(p)^.Op2).word2))); End; A_XOR: Begin If (Pai386(p)^.op1t = top_reg) And (Pai386(p)^.op2t = top_reg) And (Pai386(p)^.op1 = Pai386(p)^.op2) Then Begin DestroyReg(p, Tregister(Pai386(p)^.op1)); TmpProp^.Regs[Reg32(Tregister(Pai386(p)^.op1))].typ := Con_Const; TmpProp^.Regs[Reg32(Tregister(Pai386(p)^.op1))].StartMod := Pointer(0) End Else Destroy(p, Pai386(p)^.op2t, Pai386(p)^.op2); End Else Begin If InstrProp.NCh <> 255 Then For Cnt := 1 To InstrProp.NCh Do Case InstrProp.Ch[Cnt] Of C_None:; C_EAX..C_EDI: DestroyReg(p, TCh2Reg(InstrProp.Ch[Cnt])); C_CDirFlag: PPaiProp(Pai(p)^.fileinfo.line)^.DirFlag := F_NotSet; C_SDirFlag: PPaiProp(Pai(p)^.fileinfo.line)^.DirFlag := F_Set; C_Op1: Destroy(p, Pai386(p)^.op1t, Pai386(p)^.op1); C_Op2: Destroy(p, Pai386(p)^.op2t, Pai386(p)^.op2); C_Op3: Destroy(p, Pai386(p)^.op2t, Pointer(Longint(TwoWords(Pai386(p)^.op2).word2))); C_MemEDI: Begin FillChar(TmpRef, SizeOf(TmpRef), 0); TmpRef.Base := R_EDI; DestroyRefs(p, TmpRef, R_NO) End; C_Flags, C_FPU:; End Else Begin DestroyAllRegs(p); End; End; End; End Else Begin DestroyAllRegs(p); End; End; Inc(InstrCnt); p := Pai(p^.next); End; End; Function InitDFAPass2(AsmL: PAasmOutput): Boolean; {reserves memory for the PPaiProps in one big memory block when not using TP, returns False if not enough memory is available for the optimizer in all cases} Var p: Pai; Begin P := Pai(AsmL^.First); NrOfPaiObjs := 1; While (P <> Pai(AsmL^.last)) Do Begin Inc(NrOfPaiObjs); P := Pai(P^.next) End; {$IfDef TP} If (MemAvail < (SizeOf(TPaiProp)*NrOfPaiObjs)) {this doesn't have to be one contiguous block} Then InitDFAPass2 := False Else Begin InitDFAPass2 := True; If (MaxAvail < 65520) Then NrOfPaiFast := MaxAvail Div (((SizeOf(TPaiProp)+1) div 2)*2) Else NrOfPaiFast := 65520 Div (((SizeOf(TPaiProp)+1) div 2)*2); If (NrOfPaiFast > 0) Then GetMem(PaiPropBlock, NrOfPaiFast*(((SizeOf(TPaiProp)+1) div 2)*2)); End; {$Else} {Uncomment the next line to see how much memory the reloading optimizer needs} { Writeln((NrOfPaiObjs*(((SizeOf(TPaiProp)+3)div 4)*4)));} {no need to check mem/maxavail, we've got as much virtual memory as we want} InitDFAPass2 := True; GetMem(PaiPropBlock, NrOfPaiObjs*(((SizeOf(TPaiProp)+3)div 4)*4)); NrOfPaiFast := NrOfPaiObjs; {$EndIf TP} End; Function DFAPass2(AsmL: PAasmOutPut): Pai; Begin If InitDFAPass2(AsmL) Then DFAPass2 := DoDFAPass2(Pai(AsmL^.First)) Else DFAPass2 := Nil; End; End.