mirror of
https://gitlab.com/freepascal.org/fpc/source.git
synced 2025-04-28 22:27:03 +02:00

* merged isconvertable and is_equal into compare_defs(_ext) * made operator search faster by walking the list only once
481 lines
19 KiB
ObjectPascal
481 lines
19 KiB
ObjectPascal
{
|
|
$Id$
|
|
Copyright (c) 1998-2002 by Florian Klaempfl
|
|
|
|
Generate generic mathematical nodes
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program; if not, write to the Free Software
|
|
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
|
|
|
|
****************************************************************************
|
|
}
|
|
unit ncgmat;
|
|
|
|
{$i fpcdefs.inc}
|
|
|
|
interface
|
|
|
|
uses
|
|
node,nmat,cpubase,cgbase,cginfo;
|
|
|
|
type
|
|
tcgunaryminusnode = class(tunaryminusnode)
|
|
procedure pass_2;override;
|
|
protected
|
|
{ This routine is called to change the sign of the
|
|
floating point value in the floating point
|
|
register r.
|
|
|
|
This routine should be overriden, since
|
|
the generic version is not optimal at all. The
|
|
generic version assumes that floating
|
|
point values are stored in the register
|
|
in IEEE-754 format.
|
|
}
|
|
procedure emit_float_sign_change(r: tregister; _size : tcgsize);virtual;
|
|
end;
|
|
|
|
tcgmoddivnode = class(tmoddivnode)
|
|
procedure pass_2;override;
|
|
protected
|
|
{ This routine must do an actual 32-bit division, be it
|
|
signed or unsigned. The result must set into the the
|
|
@var(num) register.
|
|
|
|
@param(signed Indicates if the division must be signed)
|
|
@param(denum Register containing the denominator
|
|
@param(num Register containing the numerator, will also receive result)
|
|
|
|
The actual optimizations regarding shifts have already
|
|
been done and emitted, so this should really a do a divide.
|
|
}
|
|
procedure emit_div_reg_reg(signed: boolean;denum,num : tregister);virtual;abstract;
|
|
{ This routine must do an actual 32-bit modulo, be it
|
|
signed or unsigned. The result must set into the the
|
|
@var(num) register.
|
|
|
|
@param(signed Indicates if the modulo must be signed)
|
|
@param(denum Register containing the denominator
|
|
@param(num Register containing the numerator, will also receive result)
|
|
|
|
The actual optimizations regarding shifts have already
|
|
been done and emitted, so this should really a do a modulo.
|
|
}
|
|
procedure emit_mod_reg_reg(signed: boolean;denum,num : tregister);virtual;abstract;
|
|
{ This routine must do an actual 64-bit division, be it
|
|
signed or unsigned. The result must set into the the
|
|
@var(num) register.
|
|
|
|
@param(signed Indicates if the division must be signed)
|
|
@param(denum Register containing the denominator
|
|
@param(num Register containing the numerator, will also receive result)
|
|
|
|
The actual optimizations regarding shifts have already
|
|
been done and emitted, so this should really a do a divide.
|
|
Currently, this routine should only be implemented on
|
|
64-bit systems, otherwise a helper is called in 1st pass.
|
|
}
|
|
procedure emit64_div_reg_reg(signed: boolean;denum,num : tregister64);virtual;
|
|
end;
|
|
|
|
tcgshlshrnode = class(tshlshrnode)
|
|
procedure pass_2;override;
|
|
end;
|
|
|
|
|
|
implementation
|
|
|
|
uses
|
|
globtype,systems,
|
|
cutils,verbose,globals,
|
|
symconst,symdef,aasmbase,aasmtai,aasmcpu,defutil,
|
|
pass_1,pass_2,
|
|
ncon,
|
|
cpuinfo,
|
|
tgobj,ncgutil,cgobj,rgobj,rgcpu,paramgr,cg64f32;
|
|
|
|
{*****************************************************************************
|
|
TCGUNARYMINUSNODE
|
|
*****************************************************************************}
|
|
procedure tcgunaryminusnode.emit_float_sign_change(r: tregister; _size : tcgsize);
|
|
var
|
|
href : treference;
|
|
hreg : tregister;
|
|
begin
|
|
{ get a temporary memory reference to store the floating
|
|
point value
|
|
}
|
|
tg.gettemp(exprasmlist,tcgsize2size[_size],tt_normal,href);
|
|
{ store the floating point value in the temporary memory area }
|
|
cg.a_loadfpu_reg_ref(exprasmlist,_size,r,href);
|
|
{ only single and double ieee are supported }
|
|
if _size = OS_F64 then
|
|
begin
|
|
{ on little-endian machine the most significant
|
|
32-bit value is stored at the highest address
|
|
}
|
|
if target_info.endian = endian_little then
|
|
inc(href.offset,4);
|
|
end
|
|
else
|
|
if _size <> OS_F32 then
|
|
internalerror(20020814);
|
|
hreg := rg.getregisterint(exprasmlist);
|
|
{ load value }
|
|
cg.a_load_ref_reg(exprasmlist,OS_32,href,hreg);
|
|
{ bitwise complement copied value }
|
|
cg.a_op_reg_reg(exprasmlist,OP_NOT,OS_32,hreg,hreg);
|
|
{ sign-bit is bit 31/63 of single/double }
|
|
cg.a_op_const_reg(exprasmlist,OP_AND,$80000000,hreg);
|
|
{ or with value in reference memory }
|
|
cg.a_op_reg_ref(exprasmlist,OP_OR,OS_32,hreg,href);
|
|
rg.ungetregister(exprasmlist,hreg);
|
|
{ store the floating point value in the temporary memory area }
|
|
if _size = OS_F64 then
|
|
begin
|
|
{ on little-endian machine the most significant
|
|
32-bit value is stored at the highest address
|
|
}
|
|
if target_info.endian = endian_little then
|
|
dec(href.offset,4);
|
|
end;
|
|
cg.a_loadfpu_ref_reg(exprasmlist,_size,href,r);
|
|
end;
|
|
|
|
|
|
procedure tcgunaryminusnode.pass_2;
|
|
|
|
|
|
begin
|
|
if is_64bitint(left.resulttype.def) then
|
|
begin
|
|
secondpass(left);
|
|
|
|
{ load left operator in a register }
|
|
location_copy(location,left.location);
|
|
location_force_reg(exprasmlist,location,OS_64,false);
|
|
cg64.a_op64_loc_reg(exprasmlist,OP_NEG,
|
|
location,joinreg64(location.registerlow,location.registerhigh));
|
|
end
|
|
else
|
|
begin
|
|
secondpass(left);
|
|
location_reset(location,LOC_REGISTER,OS_INT);
|
|
case left.location.loc of
|
|
LOC_REGISTER:
|
|
begin
|
|
location.register:=left.location.register;
|
|
cg.a_op_reg_reg(exprasmlist,OP_NEG,OS_INT,location.register,
|
|
location.register);
|
|
end;
|
|
LOC_CREGISTER:
|
|
begin
|
|
location.register:=rg.getregisterint(exprasmlist);
|
|
cg.a_load_reg_reg(exprasmlist,OS_INT,OS_INT,left.location.register,
|
|
location.register);
|
|
cg.a_op_reg_reg(exprasmlist,OP_NEG,OS_INT,location.register,
|
|
location.register);
|
|
end;
|
|
LOC_REFERENCE,
|
|
LOC_CREFERENCE:
|
|
begin
|
|
reference_release(exprasmlist,left.location.reference);
|
|
if (left.resulttype.def.deftype=floatdef) then
|
|
begin
|
|
location_reset(location,LOC_FPUREGISTER,def_cgsize(resulttype.def));
|
|
location.register:=rg.getregisterfpu(exprasmlist);
|
|
cg.a_loadfpu_ref_reg(exprasmlist,
|
|
def_cgsize(left.resulttype.def),
|
|
left.location.reference,location.register);
|
|
emit_float_sign_change(location.register,def_cgsize(left.resulttype.def));
|
|
end
|
|
else
|
|
begin
|
|
location.register:=rg.getregisterint(exprasmlist);
|
|
{ why is the size is OS_INT, since in pass_1 we convert
|
|
everything to a signed natural value anyways
|
|
}
|
|
cg.a_load_ref_reg(exprasmlist,OS_INT,
|
|
left.location.reference,location.register);
|
|
cg.a_op_reg_reg(exprasmlist,OP_NEG,OS_INT,location.register,
|
|
location.register);
|
|
end;
|
|
end;
|
|
LOC_FPUREGISTER:
|
|
begin
|
|
location_reset(location,LOC_FPUREGISTER,def_cgsize(resulttype.def));
|
|
location.register:=left.location.register;
|
|
emit_float_sign_change(location.register,def_cgsize(left.resulttype.def));
|
|
end;
|
|
LOC_CFPUREGISTER:
|
|
begin
|
|
location_reset(location,LOC_FPUREGISTER,def_cgsize(resulttype.def));
|
|
location.register:=rg.getregisterfpu(exprasmlist);
|
|
cg.a_loadfpu_reg_reg(exprasmlist,left.location.register,location.register);
|
|
emit_float_sign_change(location.register,def_cgsize(left.resulttype.def));
|
|
end;
|
|
else
|
|
internalerror(200203225);
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
|
|
{*****************************************************************************
|
|
TCGMODDIVNODE
|
|
*****************************************************************************}
|
|
|
|
procedure tcgmoddivnode.emit64_div_reg_reg(signed: boolean; denum,num:tregister64);
|
|
begin
|
|
{ handled in pass_1 already, unless pass_1 is
|
|
overriden
|
|
}
|
|
{ should be handled in pass_1 (JM) }
|
|
internalerror(200109052);
|
|
end;
|
|
|
|
|
|
procedure tcgmoddivnode.pass_2;
|
|
var
|
|
hreg1 : tregister;
|
|
hdenom,hnumerator : tregister;
|
|
shrdiv,popeax,popedx : boolean;
|
|
power : longint;
|
|
hl : tasmlabel;
|
|
pushedregs : tmaybesave;
|
|
begin
|
|
shrdiv := false;
|
|
secondpass(left);
|
|
if codegenerror then
|
|
exit;
|
|
maybe_save(exprasmlist,right.registers32,left.location,pushedregs);
|
|
secondpass(right);
|
|
maybe_restore(exprasmlist,left.location,pushedregs);
|
|
if codegenerror then
|
|
exit;
|
|
location_copy(location,left.location);
|
|
|
|
if is_64bitint(resulttype.def) then
|
|
begin
|
|
{ this code valid for 64-bit cpu's only ,
|
|
otherwise helpers are called in pass_1
|
|
}
|
|
location_force_reg(exprasmlist,location,OS_64,false);
|
|
location_copy(location,left.location);
|
|
location_force_reg(exprasmlist,right.location,OS_64,false);
|
|
emit64_div_reg_reg(is_signed(left.resulttype.def),
|
|
joinreg64(right.location.registerlow,right.location.registerhigh),
|
|
joinreg64(location.registerlow,location.registerhigh));
|
|
end
|
|
else
|
|
begin
|
|
{ put numerator in register }
|
|
location_force_reg(exprasmlist,left.location,OS_INT,false);
|
|
hreg1:=left.location.register;
|
|
|
|
if (nodetype=divn) and
|
|
(right.nodetype=ordconstn) and
|
|
ispowerof2(tordconstnode(right).value,power) then
|
|
Begin
|
|
shrdiv := true;
|
|
{ for signed numbers, the numerator must be adjusted before the
|
|
shift instruction, but not wih unsigned numbers! Otherwise,
|
|
"Cardinal($ffffffff) div 16" overflows! (JM) }
|
|
If is_signed(left.resulttype.def) Then
|
|
Begin
|
|
objectlibrary.getlabel(hl);
|
|
cg.a_cmp_const_reg_label(exprasmlist,OS_INT,OC_GT,0,hreg1,hl);
|
|
if power=1 then
|
|
cg.a_op_const_reg(exprasmlist,OP_ADD,1,hreg1)
|
|
else
|
|
cg.a_op_const_reg(exprasmlist,OP_ADD,
|
|
tordconstnode(right).value-1,hreg1);
|
|
cg.a_label(exprasmlist,hl);
|
|
cg.a_op_const_reg(exprasmlist,OP_SAR,power,hreg1);
|
|
End
|
|
Else { not signed }
|
|
Begin
|
|
cg.a_op_const_reg(exprasmlist,OP_SHR,power,hreg1);
|
|
end;
|
|
End
|
|
else
|
|
begin
|
|
{ bring denominator to hdenom }
|
|
{ hdenom is always free, it's }
|
|
{ only used for temporary }
|
|
{ purposes }
|
|
hdenom := rg.getregisterint(exprasmlist);
|
|
if right.location.loc<>LOC_CREGISTER then
|
|
location_release(exprasmlist,right.location);
|
|
cg.a_load_loc_reg(exprasmlist,right.location,hdenom);
|
|
{ verify if the divisor is zero, if so return an error
|
|
immediately
|
|
}
|
|
objectlibrary.getlabel(hl);
|
|
cg.a_cmp_const_reg_label(exprasmlist,OS_INT,OC_NE,0,hdenom,hl);
|
|
cg.a_param_const(exprasmlist,OS_S32,200,paramanager.getintparaloc(1));
|
|
cg.a_call_name(exprasmlist,'FPC_HANDLERROR');
|
|
cg.a_label(exprasmlist,hl);
|
|
if nodetype = modn then
|
|
emit_mod_reg_reg(is_signed(left.resulttype.def),hdenom,hreg1)
|
|
else
|
|
emit_div_reg_reg(is_signed(left.resulttype.def),hdenom,hreg1);
|
|
end;
|
|
location_reset(location,LOC_REGISTER,OS_INT);
|
|
location.register:=hreg1;
|
|
end;
|
|
cg.g_overflowcheck(exprasmlist,self);
|
|
end;
|
|
|
|
|
|
{*****************************************************************************
|
|
TCGSHLRSHRNODE
|
|
*****************************************************************************}
|
|
|
|
|
|
procedure tcgshlshrnode.pass_2;
|
|
var
|
|
hcountreg : tregister;
|
|
op : topcg;
|
|
l1,l2,l3 : tasmlabel;
|
|
pushedregs : tmaybesave;
|
|
freescratch : boolean;
|
|
begin
|
|
freescratch:=false;
|
|
secondpass(left);
|
|
maybe_save(exprasmlist,right.registers32,left.location,pushedregs);
|
|
secondpass(right);
|
|
maybe_restore(exprasmlist,left.location,pushedregs);
|
|
{ determine operator }
|
|
case nodetype of
|
|
shln: op:=OP_SHL;
|
|
shrn: op:=OP_SHR;
|
|
end;
|
|
|
|
if is_64bitint(left.resulttype.def) then
|
|
begin
|
|
{ already hanled in 1st pass }
|
|
internalerror(2002081501);
|
|
(* Normally for 64-bit cpu's this here should be here,
|
|
and only pass_1 need to be overriden, but dunno how to
|
|
do that!
|
|
location_reset(location,LOC_REGISTER,OS_64);
|
|
|
|
{ load left operator in a register }
|
|
location_force_reg(exprasmlist,left.location,OS_64,false);
|
|
location_copy(location,left.location);
|
|
|
|
if (right.nodetype=ordconstn) then
|
|
begin
|
|
cg64.a_op64_const_reg(exprasmlist,op,tordconstnode(right).value,
|
|
joinreg64(location.registerlow,location.registerhigh));
|
|
end
|
|
else
|
|
begin
|
|
{ this should be handled in pass_1 }
|
|
internalerror(2002081501);
|
|
|
|
if right.location.loc<>LOC_REGISTER then
|
|
begin
|
|
if right.location.loc<>LOC_CREGISTER then
|
|
location_release(exprasmlist,right.location);
|
|
hcountreg:=cg.get_scratch_reg_int(exprasmlist);
|
|
cg.a_load_loc_reg(exprasmlist,right.location,hcountreg);
|
|
freescratch := true;
|
|
end
|
|
else
|
|
hcountreg:=right.location.register;
|
|
cg64.a_op64_reg_reg(exprasmlist,op,hcountreg,
|
|
joinreg64(location.registerlow,location.registerhigh));
|
|
if freescratch then
|
|
cg.free_scratch_reg(exprasmlist,hcountreg);
|
|
end;*)
|
|
end
|
|
else
|
|
begin
|
|
{ load left operators in a register }
|
|
location_copy(location,left.location);
|
|
location_force_reg(exprasmlist,location,OS_INT,false);
|
|
|
|
{ shifting by a constant directly coded: }
|
|
if (right.nodetype=ordconstn) then
|
|
begin
|
|
{ l shl 32 should 0 imho, but neither TP nor Delphi do it in this way (FK)
|
|
if right.value<=31 then
|
|
}
|
|
cg.a_op_const_reg(exprasmlist,op,tordconstnode(right).value and 31,
|
|
location.register);
|
|
{
|
|
else
|
|
emit_reg_reg(A_XOR,S_L,hregister1,
|
|
hregister1);
|
|
}
|
|
end
|
|
else
|
|
begin
|
|
{ load right operators in a register - this
|
|
is done since most target cpu which will use this
|
|
node do not support a shift count in a mem. location (cec)
|
|
}
|
|
if right.location.loc<>LOC_REGISTER then
|
|
begin
|
|
if right.location.loc<>LOC_CREGISTER then
|
|
location_release(exprasmlist,right.location);
|
|
hcountreg:=cg.get_scratch_reg_int(exprasmlist);
|
|
freescratch := true;
|
|
cg.a_load_loc_reg(exprasmlist,right.location,hcountreg);
|
|
end
|
|
else
|
|
hcountreg:=right.location.register;
|
|
cg.a_op_reg_reg(exprasmlist,op,OS_INT,hcountreg,location.register);
|
|
if freescratch then
|
|
cg.free_scratch_reg(exprasmlist,hcountreg);
|
|
end;
|
|
end;
|
|
end;
|
|
|
|
|
|
|
|
begin
|
|
cmoddivnode:=tcgmoddivnode;
|
|
cunaryminusnode:=tcgunaryminusnode;
|
|
cshlshrnode:=tcgshlshrnode;
|
|
end.
|
|
{
|
|
$Log$
|
|
Revision 1.5 2002-11-25 17:43:18 peter
|
|
* splitted defbase in defutil,symutil,defcmp
|
|
* merged isconvertable and is_equal into compare_defs(_ext)
|
|
* made operator search faster by walking the list only once
|
|
|
|
Revision 1.4 2002/09/17 18:54:02 jonas
|
|
* a_load_reg_reg() now has two size parameters: source and dest. This
|
|
allows some optimizations on architectures that don't encode the
|
|
register size in the register name.
|
|
|
|
Revision 1.3 2002/08/23 16:14:48 peter
|
|
* tempgen cleanup
|
|
* tt_noreuse temp type added that will be used in genentrycode
|
|
|
|
Revision 1.2 2002/08/15 15:15:55 carl
|
|
* jmpbuf size allocation for exceptions is now cpu specific (as it should)
|
|
* more generic nodes for maths
|
|
* several fixes for better m68k support
|
|
|
|
Revision 1.1 2002/08/14 19:26:55 carl
|
|
+ generic int_to_real type conversion
|
|
+ generic unaryminus node
|
|
|
|
}
|