fpc/compiler/llvm/llvmpara.pas
Jonas Maebe 2949d0b548 LLVM: only add sret attribute for first parameter on caller side
We already did this when generating the definitions, but not yet
when generating the calls
2023-07-30 22:22:28 +02:00

358 lines
13 KiB
ObjectPascal

{
Copyright (c) 2013 by Jonas Maebe
Includes the llvm parameter manager
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
****************************************************************************
}
unit llvmpara;
{$i fpcdefs.inc}
interface
uses
globtype,aasmdata,
symconst,symtype,symdef,symsym,
parabase,cgbase,
cpupara;
type
{ LLVM stands for "low level code generator", and regarding parameter
handling it is indeed very low level. We are responsible for decomposing
aggregate parameters into multiple simple parameters in case they have
to be passed in special registers (such as floating point or SSE), and
also for indicating whether e.g. 8 bit parameters need to be sign or
zero exntended. This corresponds to pretty much what we do when creating
parameter locations, so we reuse the original parameter manager and then
process its output.
The future will tell whether we can do this without
architecture-specific code, or whether we will have to integrate parts
into the various tcpuparamanager classes }
tllvmparamanager = class(tcpuparamanager)
function push_addr_param(varspez: tvarspez; def: tdef; calloption: tproccalloption): boolean; override;
procedure getcgtempparaloc(list: TAsmList; pd: tabstractprocdef; nr: longint; var cgpara: tcgpara); override;
function param_use_paraloc(const cgpara: tcgpara): boolean; override;
procedure createtempparaloc(list: TAsmList; calloption: tproccalloption; parasym: tparavarsym; can_use_final_stack_loc: boolean; var cgpara: TCGPara); override;
function create_paraloc_info(p: tabstractprocdef; side: tcallercallee): longint; override;
function create_varargs_paraloc_info(p: tabstractprocdef; side: tcallercallee; varargspara: tvarargsparalist): longint; override;
function get_funcretloc(p: tabstractprocdef; side: tcallercallee; forcetempdef: tdef): tcgpara; override;
function has_strict_proc_signature: boolean; override;
private
procedure create_paraloc_info_internllvm(p: tabstractprocdef; side: tcallercallee);
procedure set_llvm_paraloc_name(p: tabstractprocdef; hp: tparavarsym; var para: tcgpara);
procedure add_llvm_callee_paraloc_names(p: tabstractprocdef);
procedure reducetosingleregparaloc(paraloc: PCGParaLocation; def: tdef; reg: tregister);
procedure reduceparalocs(p: tabstractprocdef; side: tcallercallee; paras: tparalist);
end;
implementation
uses
verbose,
aasmbase,
llvmsym,
paramgr,defutil,llvmdef,
cgutils,tgobj,hlcgobj;
{ tllvmparamanager }
function tllvmparamanager.push_addr_param(varspez: tvarspez; def: tdef; calloption: tproccalloption): boolean;
begin
if def<>llvm_metadatatype then
begin
result:=inherited;
exit;
end;
result:=false;
end;
procedure tllvmparamanager.getcgtempparaloc(list: TAsmList; pd: tabstractprocdef; nr: longint; var cgpara: tcgpara);
begin
if (nr<1) or (nr>pd.paras.count) then
InternalError(2015040402);
pd.init_paraloc_info(callerside);
createtempparaloc(list,pd.proccalloption,tparavarsym(pd.paras[nr-1]),true,cgpara);
end;
function tllvmparamanager.param_use_paraloc(const cgpara: tcgpara): boolean;
begin
{ we can use the paraloc on the callee side if the SSA property is
guaranteed, i.e., if it is a constant location (and if it's not been
split up into multiple locations for ABI reasons). We can't deduce that
from the paraloc though, we need the parasym for that. Potential
future optimisation, although llvm will probably optimise away the
temps we create anyway }
result:=false;
end;
procedure tllvmparamanager.reducetosingleregparaloc(paraloc: PCGParaLocation; def: tdef; reg: tregister);
var
nextloc: pcgparalocation;
begin
paraloc^.def:=def;
paraloc^.size:=def_cgsize(def);
paraloc^.register:=reg;
paraloc^.shiftval:=0;
{ remove all other paralocs }
while assigned(paraloc^.next) do
begin
nextloc:=paraloc^.next;
paraloc^.next:=nextloc^.next;
dispose(nextloc);
end;
end;
procedure tllvmparamanager.reduceparalocs(p: tabstractprocdef; side: tcallercallee; paras: tparalist);
var
paranr: longint;
hp: tparavarsym;
paraloc: PCGParaLocation;
begin
for paranr:=0 to paras.count-1 do
begin
hp:=tparavarsym(paras[paranr]);
paraloc:=hp.paraloc[side].location;
if assigned(paraloc) then
begin
if assigned(paraloc^.next) and
(hp.paraloc[side].def.typ in [orddef,enumdef,floatdef]) then
begin
if not(paraloc^.loc in [LOC_REGISTER,LOC_FPUREGISTER,LOC_MMREGISTER]) then
internalerror(2019011902);
reducetosingleregparaloc(paraloc,hp.paraloc[side].def,paraloc^.register);
end
else if paraloc^.def=llvm_metadatatype then
begin
paraloc^.Loc:=LOC_REGISTER;
// will be overwritten with a "register" whose superregister is an index in the LLVM metadata table
paraloc^.register:=NR_INVALID;
end;
end;
end;
end;
procedure tllvmparamanager.createtempparaloc(list: TAsmList; calloption: tproccalloption; parasym: tparavarsym; can_use_final_stack_loc: boolean; var cgpara: TCGPara);
var
paraloc: pcgparalocation;
paralocdef: tdef;
begin
inherited;
paraloc:=cgpara.location;
{ No need to set paraloc^.llvmloc.*, these are not used/needed for temp
paralocs }
while assigned(paraloc) do
begin
if (vo_is_funcret in parasym.varoptions) and
{ sret attribute is only valid for the first parameter; sometimes
FPC will place other parameters first (e.g. self), and then
we can't use it; we use other attributes in that case to
approximate the optimisations that LLVM can do for sret }
(tabstractprocdef(parasym.owner.defowner).paras[0] = parasym)
{$ifdef aarch64}
{ see AArch64's tcpuparamanager.create_paraloc_info_intern() }
and not is_managed_type(parasym.vardef)
{$endif aarch64}
then
paraloc^.retvalloc:=true;
{ ordinal parameters must be passed as a single paraloc }
if (cgpara.def.typ in [orddef,enumdef,floatdef]) and
assigned(paraloc^.next) then
begin
paraloc^.loc:=LOC_REGISTER;
reducetosingleregparaloc(paraloc,cgpara.def,hlcg.getintregister(list,cgpara.def));
end;
{ varargs parameters do not have a parasym.owner, but they're always
by value }
if (assigned(parasym.owner) and
paramanager.push_addr_param(parasym.varspez,parasym.vardef,tabstractprocdef(parasym.owner.defowner).proccalloption)) or
not llvmbyvalparaloc(paraloc) then
begin
case paraloc^.loc of
LOC_REFERENCE:
begin
case hlcg.def2regtyp(paraloc^.def) of
R_INTREGISTER,
R_ADDRESSREGISTER:
paraloc^.loc:=LOC_REGISTER;
R_FPUREGISTER:
paraloc^.loc:=LOC_FPUREGISTER;
R_MMREGISTER:
paraloc^.Loc:=LOC_MMREGISTER;
else
internalerror(2013012308);
end;
paraloc^.register:=hlcg.getregisterfordef(list,paraloc^.def);
paraloc^.llvmvalueloc:=true;
{ paraloc^.reference overlaid this field, so zero it now
that we turned it into a register location }
paraloc^.shiftval:=0;
end;
LOC_REGISTER,
LOC_FPUREGISTER,
LOC_MMREGISTER:
begin
paraloc^.llvmvalueloc:=true;
end;
LOC_VOID:
begin
{ for empty records, ensure these don't get a byval
attribute }
paraloc^.llvmvalueloc:=true;
end;
else
internalerror(2014012302);
end;
end
else
begin
{ turn this paraloc into the "byval" parameter: at the llvm level,
a pointer to the value that it should place on the stack (or
passed in registers, in some cases) }
paraloc^.llvmvalueloc:=false;
paraloc^.loc:=LOC_REGISTER;
paralocdef:=cpointerdef.getreusable_no_free(paraloc^.def);
reducetosingleregparaloc(paraloc,paralocdef,hlcg.getaddressregister(list,paralocdef));
end;
paraloc^.llvmloc.loc:=paraloc^.loc;
paraloc^.llvmloc.reg:=paraloc^.register;
paraloc:=paraloc^.next;
end;
end;
function tllvmparamanager.create_paraloc_info(p: tabstractprocdef; side: tcallercallee): longint;
begin
result:=inherited;
create_paraloc_info_internllvm(p,side);
end;
function tllvmparamanager.create_varargs_paraloc_info(p: tabstractprocdef; side: tcallercallee; varargspara: tvarargsparalist): longint;
begin
result:=inherited;
create_paraloc_info_internllvm(p,side);
if assigned(varargspara) then
reduceparalocs(p,side,varargspara);
end;
function tllvmparamanager.get_funcretloc(p: tabstractprocdef; side: tcallercallee; forcetempdef: tdef): tcgpara;
var
paraloc: pcgparalocation;
begin
result:=inherited;
paraloc:=result.location;
repeat
paraloc^.llvmvalueloc:=true;
paraloc:=paraloc^.next;
until not assigned(paraloc);
paraloc:=result.location;
if assigned(paraloc^.next) and
(result.def.typ in [orddef,enumdef,floatdef]) and
((side=callerside) or
not(po_assembler in p.procoptions)) then
begin
if not(paraloc^.loc in [LOC_REGISTER,LOC_FPUREGISTER,LOC_MMREGISTER]) then
internalerror(2019011901);
reducetosingleregparaloc(paraloc,result.def,paraloc^.register);
end;
end;
function tllvmparamanager.has_strict_proc_signature: boolean;
begin
result:=true;
end;
procedure tllvmparamanager.create_paraloc_info_internllvm(p: tabstractprocdef; side: tcallercallee);
begin
{ on the calleeside, llvm declares the parameters similar to Pascal or C
(a list of parameters and their types), but they correspond more
closely to parameter locations than to parameters -> add names to the
locations }
if (side=calleeside) and
not(po_assembler in p.procoptions) then
begin
add_llvm_callee_paraloc_names(p);
reduceparalocs(p,side,p.paras);
end
else if side=callerside then
begin
reduceparalocs(p,side,p.paras);
end;
end;
{ hp non-nil: parasym to check
hp nil: function result
}
procedure tllvmparamanager.set_llvm_paraloc_name(p: tabstractprocdef; hp: tparavarsym; var para: tcgpara);
var
paraloc: PCGParaLocation;
paralocnr: longint;
begin
paraloc:=hp.paraloc[calleeside].location;
paralocnr:=0;
repeat
paraloc^.llvmloc.loc:=LOC_REFERENCE;
paraloc^.llvmloc.sym:=current_asmdata.DefineAsmSymbol(llvmparaname(hp,paralocnr),AB_TEMP,AT_DATA,paraloc^.def);
{ byval: a pointer to a type that should actually be passed by
value (e.g. a record that should be passed on the stack) }
paraloc^.llvmvalueloc:=
paramanager.push_addr_param(hp.varspez,hp.vardef,p.proccalloption) or
not llvmbyvalparaloc(paraloc);
paraloc:=paraloc^.next;
inc(paralocnr);
until not assigned(paraloc);
end;
procedure tllvmparamanager.add_llvm_callee_paraloc_names(p: tabstractprocdef);
var
paranr: longint;
hp: tparavarsym;
begin
for paranr:=0 to p.paras.count-1 do
begin
hp:=tparavarsym(p.paras[paranr]);
set_llvm_paraloc_name(p,hp,hp.paraloc[calleeside]);
end;
end;
begin
if not assigned(paramanager) then
begin
writeln('Internalerror 2018052006');
halt(1);
end;
{ replace the native parameter manager. Maybe this has to be moved to a
procedure like the creations of the code generators, but possibly not since
we still call the original paramanager }
paramanager.free;
paramanager:=tllvmparamanager.create;
end.