{
    Copyright (c) 1998-2002 by Carl Eric Codere and Peter Vreman

    Does the parsing for the ARM GNU AS styled inline assembler.

    This program is free software; you can redistribute it and/or modify
    it under the terms of the GNU General Public License as published by
    the Free Software Foundation; either version 2 of the License, or
    (at your option) any later version.

    This program is distributed in the hope that it will be useful,
    but WITHOUT ANY WARRANTY; without even the implied warranty of
    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
    GNU General Public License for more details.

    You should have received a copy of the GNU General Public License
    along with this program; if not, write to the Free Software
    Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.

 ****************************************************************************
}
Unit raarmgas;

{$i fpcdefs.inc}

  Interface

    uses
      raatt,raarm,
      cpubase;

    type
      { Inline assembler reader for ARM using GNU AS syntax. }
      tarmattreader = class(tattreader)
        { postfix of the opcode recognised last by is_asmopcode,
          copied into the instruction by BuildOpCode }
        actoppostfix : TOpPostfix;
        function is_asmopcode(const s: string):boolean;override;
        function is_register(const s:string):boolean;override;
        procedure handleopcode;override;
        procedure BuildReference(oper : tarmoperand);
        procedure BuildOperand(oper : tarmoperand);
        function TryBuildShifterOp(oper : tarmoperand) : boolean;
        procedure BuildOpCode(instr : tarminstruction);
        procedure ReadSym(oper : tarmoperand);
        procedure ConvertCalljmp(instr : tarminstruction);
      end;


  Implementation

    uses
      { helpers }
      cutils,
      { global }
      globtype,globals,verbose,
      systems,
      { aasm }
      cpuinfo,aasmbase,aasmtai,aasmcpu,
      { symtable }
      symconst,symbase,symtype,symsym,symtable,
      { parser }
      scanner,
      procinfo,
      itcpugas,
      rabase,rautils,
      cgbase,cgobj
      ;


    { Returns true if s names a register. The inherited check is tried
      first; if it fails and s is exactly two characters long, the table of
      two-letter aliases below is searched. On an alias match actasmregister
      and actasmtoken are set. The comparison is done against upper case
      names, so s is expected to be upper case already. }
    function tarmattreader.is_register(const s:string):boolean;
      type
        treg2str = record
          name : string[2];
          reg : tregister;
        end;

      const
        extraregs : array[0..19] of treg2str = (
          (name: 'A1'; reg : NR_R0),
          (name: 'A2'; reg : NR_R1),
          (name: 'A3'; reg : NR_R2),
          (name: 'A4'; reg : NR_R3),
          (name: 'V1'; reg : NR_R4),
          (name: 'V2'; reg : NR_R5),
          (name: 'V3'; reg : NR_R6),
          (name: 'V4'; reg : NR_R7),
          (name: 'V5'; reg : NR_R8),
          (name: 'V6'; reg : NR_R9),
          (name: 'V7'; reg : NR_R10),
          (name: 'V8'; reg : NR_R11),
          (name: 'WR'; reg : NR_R7),
          (name: 'SB'; reg : NR_R9),
          (name: 'SL'; reg : NR_R10),
          (name: 'FP'; reg : NR_R11),
          (name: 'IP'; reg : NR_R12),
          (name: 'SP'; reg : NR_R13),
          (name: 'LR'; reg : NR_R14),
          (name: 'PC'; reg : NR_R15));

      var
        i : longint;

      begin
        result:=inherited is_register(s);
        { reg found?
          possible aliases are always 2 char
        }
        if result or (length(s)<>2) then
          exit;
        for i:=low(extraregs) to high(extraregs) do
          begin
            if s=extraregs[i].name then
              begin
                actasmregister:=extraregs[i].reg;
                result:=true;
                actasmtoken:=AS_REGISTER;
                exit;
              end;
          end;
      end;


    { Reads an identifier into oper: either a typecast "type(operand)" or a
      variable set up through oper.SetupVar. An optional trailing
      ".field" adds the field offset to the operand. }
    procedure tarmattreader.ReadSym(oper : tarmoperand);
      var
        tempstr : string;
        typesize,l,k : longint;
      begin
        tempstr:=actasmpattern;
        Consume(AS_ID);
        { typecasting? }
        if (actasmtoken=AS_LPAREN) and
           SearchType(tempstr,typesize) then
          begin
            oper.hastype:=true;
            Consume(AS_LPAREN);
            BuildOperand(oper);
            Consume(AS_RPAREN);
            if oper.opr.typ in [OPR_REFERENCE,OPR_LOCAL] then
              oper.SetSize(typesize,true);
          end
        else
          if not oper.SetupVar(tempstr,false) then
            Message1(sym_e_unknown_id,tempstr);
        { record.field ? }
        if actasmtoken=AS_DOT then
          begin
            BuildRecordOffsetSize(tempstr,l,k);
            { the offset lives in a different field depending on the kind
              of operand, so dispatch on it the same way BuildOperand does
              instead of always writing to ref.offset }
            case oper.opr.typ of
              OPR_LOCAL :
                inc(oper.opr.localsymofs,l);
              OPR_CONSTANT :
                inc(oper.opr.val,l);
              OPR_REFERENCE :
                inc(oper.opr.ref.offset,l);
              else
                Message(asmr_e_invalid_operand_type);
            end;
          end;
      end;


    { Parses a bracketed memory reference into oper.opr.ref. Accepted
      forms are
        [Rn]              plain base register
        [Rn],<index>      post-indexed
        [Rn,<index>]      base plus index/offset
        [Rn,<index>]!     pre-indexed
      where <index> is a register or "#constant".
      The caller is expected to have initialised the reference (BuildOperand
      calls oper.InitRef first); the address mode is only written here for
      the post- and pre-indexed forms. }
    Procedure tarmattreader.BuildReference(oper : tarmoperand);

      { Consumes the closing ']' and checks the token following it.
        allowwriteback tells whether a '!' (AS_NOT) may follow the bracket;
        without it the pre-indexed form would always be rejected here,
        before the caller gets a chance to look at the '!'. }
      procedure Consume_RBracket(allowwriteback : boolean);
        begin
          if actasmtoken<>AS_RBRACKET then
            Begin
              Message(asmr_e_invalid_reference_syntax);
              RecoverConsume(true);
            end
          else
            begin
              Consume(AS_RBRACKET);
              if not((actasmtoken in [AS_COMMA,AS_SEPARATOR,AS_END]) or
                     (allowwriteback and (actasmtoken=AS_NOT))) then
                Begin
                  Message(asmr_e_invalid_reference_syntax);
                  RecoverConsume(true);
                end;
            end;
        end;


      { Consumes ",<register>" or ",#<constant>". A register is stored as
        index register, a constant is added to the offset. Any other token
        after the comma is left untouched for the caller. }
      procedure read_index;
        begin
          Consume(AS_COMMA);
          if actasmtoken=AS_REGISTER then
            Begin
              oper.opr.ref.index:=actasmregister;
              Consume(AS_REGISTER);
            end
          else if actasmtoken=AS_HASH then
            begin
              Consume(AS_HASH);
              inc(oper.opr.ref.offset,BuildConstExpression(false,true));
            end;
        end;


      begin
        Consume(AS_LBRACKET);
        if actasmtoken=AS_REGISTER then
          begin
            oper.opr.ref.base:=actasmregister;
            Consume(AS_REGISTER);
            { the base register is followed either by the closing bracket
              or by a comma and an index }
            if actasmtoken=AS_RBRACKET then
              Begin
                { [Rn] possibly followed by a post index }
                Consume_RBracket(false);
                { only an index behind the bracket makes the reference
                  post-indexed, a plain [Rn] keeps the mode it had }
                if actasmtoken=AS_COMMA then
                  begin
                    oper.opr.ref.addressmode:=AM_POSTINDEXED;
                    read_index;
                  end;
                exit;
              end;
            if actasmtoken=AS_COMMA then
              begin
                read_index;
                Consume_RBracket(true);
              end;
            { write back requested? }
            if actasmtoken=AS_NOT then
              begin
                consume(AS_NOT);
                oper.opr.ref.addressmode:=AM_PREINDEXED;
              end;
          end {end case }
        else
          Begin
            Message(asmr_e_invalid_reference_syntax);
            RecoverConsume(false);
          end;
      end;


    { Tries to parse a shifter operand (LSL, LSR, ASR, ROR followed by a
      register or "#constant", or RRX without argument) into oper.
      Returns false, without consuming anything, if the current token is
      not one of these identifiers. }
    function tarmattreader.TryBuildShifterOp(oper : tarmoperand) : boolean;

      { Consumes the shift mnemonic, turns oper into a shifter operand with
        shift mode sm and, for every mode but RRX, reads the shift amount. }
      procedure handlepara(sm : tshiftmode);
        begin
          consume(AS_ID);
          fillchar(oper.opr,sizeof(oper.opr),0);
          oper.opr.typ:=OPR_SHIFTEROP;
          oper.opr.shifterop.shiftmode:=sm;
          if sm<>SM_RRX then
            begin
              case actasmtoken of
                AS_REGISTER:
                  begin
                    oper.opr.shifterop.rs:=actasmregister;
                    consume(AS_REGISTER);
                  end;
                AS_HASH:
                  begin
                    consume(AS_HASH);
                    oper.opr.shifterop.shiftimm:=BuildConstExpression(false,false);
                  end;
                else
                  Message(asmr_e_illegal_shifterop_syntax);
              end;
            end;
        end;


      begin
        result:=true;
        if (actasmtoken=AS_ID) then
          begin
            if (actasmpattern='LSL') then
              handlepara(SM_LSL)
            else if (actasmpattern='LSR') then
              handlepara(SM_LSR)
            else if (actasmpattern='ASR') then
              handlepara(SM_ASR)
            else if (actasmpattern='ROR') then
              handlepara(SM_ROR)
            else if (actasmpattern='RRX') then
              { RRX has its own shift mode and takes no shift amount }
              handlepara(SM_RRX)
            else
              result:=false;
          end
        else
          result:=false;
      end;


    { Parses a single operand into oper. Depending on the current token
      this is a memory reference, a "#constant", an identifier (label,
      constant, typecast or variable), a register, or a register set. }
    Procedure tarmattreader.BuildOperand(oper : tarmoperand);
      var
        expr : string;
        typesize,l : longint;


        { Stores the label hl in oper: as plain symbol for a call/jump
          opcode that is not followed by '+', '-' or '(', otherwise as the
          symbol of a freshly initialised reference. }
        procedure AddLabelOperand(hl:tasmlabel);
          begin
            if not(actasmtoken in [AS_PLUS,AS_MINUS,AS_LPAREN]) and
               is_calljmp(actopcode) then
              begin
                oper.opr.typ:=OPR_SYMBOL;
                oper.opr.symbol:=hl;
              end
            else
              begin
                oper.InitRef;
                oper.opr.ref.symbol:=hl;
              end;
          end;


        { Handles ".field" and/or a "+/- constant" behind an identifier and
          adds the resulting offset to the operand. }
        procedure MaybeRecordOffset;
          var
            hasdot : boolean;
            l,
            toffset,
            tsize : longint;
          begin
            if not(actasmtoken in [AS_DOT,AS_PLUS,AS_MINUS]) then
              exit;
            l:=0;
            hasdot:=(actasmtoken=AS_DOT);
            if hasdot then
              begin
                if expr<>'' then
                  begin
                    BuildRecordOffsetSize(expr,toffset,tsize);
                    inc(l,toffset);
                    oper.SetSize(tsize,true);
                  end;
              end;
            if actasmtoken in [AS_PLUS,AS_MINUS] then
              inc(l,BuildConstExpression(true,false));
            case oper.opr.typ of
              OPR_LOCAL :
                begin
                  { don't allow direct access to fields of parameters, because that
                    will generate buggy code. Allow it only for explicit typecasting }
                  if hasdot and
                     (not oper.hastype) and
                     (tabstractnormalvarsym(oper.opr.localsym).owner.symtabletype=parasymtable) and
                     (current_procinfo.procdef.proccalloption<>pocall_register) then
                    Message(asmr_e_cannot_access_field_directly_for_parameters);
                  inc(oper.opr.localsymofs,l)
                end;
              OPR_CONSTANT :
                inc(oper.opr.val,l);
              OPR_REFERENCE :
                inc(oper.opr.ref.offset,l);
              else
                internalerror(200309221);
            end;
          end;


      var
        tempreg : tregister;
        ireg : tsuperregister;
        hl : tasmlabel;
        registerset : tcpuregisterset;
      Begin
        expr:='';
        case actasmtoken of
          AS_LBRACKET: { Memory reference }
            Begin
              oper.InitRef;
              BuildReference(oper);
            end;

          AS_HASH: { Constant expression  }
            Begin
              Consume(AS_HASH);
              BuildConstantOperand(oper);
            end;

          AS_ID: { A constant expression, or a Variable ref.  }
            Begin
              { Local Label ? }
              if is_locallabel(actasmpattern) then
                begin
                  CreateLocalLabel(actasmpattern,hl,false);
                  Consume(AS_ID);
                  AddLabelOperand(hl);
                end
              else
                { Check for label }
                if SearchLabel(actasmpattern,hl,false) then
                  begin
                    Consume(AS_ID);
                    AddLabelOperand(hl);
                  end
              else
                { probably a variable or normal expression }
                { or a procedure (such as in CALL ID)      }
                Begin
                  { is it a constant ? }
                  if SearchIConstant(actasmpattern,l) then
                    Begin
                      if not (oper.opr.typ in [OPR_NONE,OPR_CONSTANT]) then
                        Message(asmr_e_invalid_operand_type);
                      BuildConstantOperand(oper);
                    end
                  else
                    begin
                      expr:=actasmpattern;
                      Consume(AS_ID);
                      { typecasting? }
                      if (actasmtoken=AS_LPAREN) and
                         SearchType(expr,typesize) then
                        begin
                          oper.hastype:=true;
                          Consume(AS_LPAREN);
                          BuildOperand(oper);
                          Consume(AS_RPAREN);
                          if oper.opr.typ in [OPR_REFERENCE,OPR_LOCAL] then
                            oper.SetSize(typesize,true);
                        end
                      else
                        begin
                          if not(oper.SetupVar(expr,false)) then
                            Begin
                              { look for special symbols ... }
                              if expr= '__HIGH' then
                                begin
                                  consume(AS_LPAREN);
                                  if not oper.setupvar('high'+actasmpattern,false) then
                                    Message1(sym_e_unknown_id,'high'+actasmpattern);
                                  consume(AS_ID);
                                  consume(AS_RPAREN);
                                end
                              else
                                if expr = '__RESULT' then
                                  oper.SetUpResult
                              else
                                if expr = '__SELF' then
                                  oper.SetupSelf
                              else
                                if expr = '__OLDEBP' then
                                  oper.SetupOldEBP
                              else
                                Message1(sym_e_unknown_id,expr);
                            end;
                        end;
                    end;
                  if actasmtoken=AS_DOT then
                    MaybeRecordOffset;
                  { add a constant expression? }
                  if (actasmtoken=AS_PLUS) then
                    begin
                      l:=BuildConstExpression(true,false);
                      case oper.opr.typ of
                        OPR_CONSTANT :
                          inc(oper.opr.val,l);
                        OPR_LOCAL :
                          inc(oper.opr.localsymofs,l);
                        OPR_REFERENCE :
                          inc(oper.opr.ref.offset,l);
                        else
                          internalerror(200309202);
                      end;
                    end
                end;
              { Do we have a indexing reference, then parse it also }
              if actasmtoken=AS_LPAREN then
                BuildReference(oper);
            end;

          { Register, a variable reference or a constant reference  }
          AS_REGISTER:
            Begin
              { save the type of register used. }
              tempreg:=actasmregister;
              Consume(AS_REGISTER);
              if (actasmtoken in [AS_END,AS_SEPARATOR,AS_COMMA]) then
                Begin
                  if not (oper.opr.typ in [OPR_NONE,OPR_REGISTER]) then
                    Message(asmr_e_invalid_operand_type);
                  oper.opr.typ:=OPR_REGISTER;
                  oper.opr.reg:=tempreg;
                end
              else if (actasmtoken=AS_NOT) and (actopcode in [A_LDM,A_STM]) then
                begin
                  { "Rn!" as base of LDM/STM: stored as pre-indexed
                    reference with the register in the index field }
                  consume(AS_NOT);
                  oper.opr.typ:=OPR_REFERENCE;
                  oper.opr.ref.addressmode:=AM_PREINDEXED;
                  oper.opr.ref.index:=tempreg;
                end
              else
                Message(asmr_e_syn_operand);
            end;

          { Registerset: comma separated registers or register ranges
            (Ra-Rb) between AS_LSBRACKET and AS_RSBRACKET }
          AS_LSBRACKET:
            begin
              consume(AS_LSBRACKET);
              registerset:=[];
              while true do
                begin
                  if actasmtoken=AS_REGISTER then
                    begin
                      include(registerset,getsupreg(actasmregister));
                      tempreg:=actasmregister;
                      consume(AS_REGISTER);
                      if actasmtoken=AS_MINUS then
                        begin
                          consume(AS_MINUS);
                          for ireg:=getsupreg(tempreg) to getsupreg(actasmregister) do
                            include(registerset,ireg);
                          consume(AS_REGISTER);
                        end;
                    end
                  else
                    { not a register: let consume report the error }
                    consume(AS_REGISTER);
                  if actasmtoken=AS_COMMA then
                    consume(AS_COMMA)
                  else
                    break;
                end;
              consume(AS_RSBRACKET);
              oper.opr.typ:=OPR_REGSET;
              oper.opr.regset:=registerset;
            end;

          AS_END,
          AS_SEPARATOR,
          AS_COMMA: ;
          else
            Begin
              Message(asmr_e_syn_operand);
              Consume(actasmtoken);
            end;
        end; { end case }
      end;


{*****************************************************************************
                                tarmattreader
*****************************************************************************}

    { Fills instr from the current opcode token and the operands following
      it. Opcode, condition and postfix are taken from actopcode,
      actcondition and actoppostfix; instr.Ops receives the number of
      operands read. }
    procedure tarmattreader.BuildOpCode(instr : tarminstruction);
      var
        operandnum : longint;
      Begin
        { opcode }
        if (actasmtoken<>AS_OPCODE) then
          Begin
            Message(asmr_e_invalid_or_missing_opcode);
            RecoverConsume(true);
            exit;
          end;
        { Fill the instr object with the current state }
        with instr do
          begin
            Opcode:=ActOpcode;
            condition:=ActCondition;
            oppostfix:=actoppostfix;
          end;

        { We are reading operands, so opcode will be an AS_ID }
        operandnum:=1;
        Consume(AS_OPCODE);
        { Zero operand opcode ?  }
        if actasmtoken in [AS_SEPARATOR,AS_END] then
          begin
            instr.Ops:=0;
            exit;
          end;
        { Read the operands }
        repeat
          case actasmtoken of
            AS_COMMA: { Operand delimiter }
              Begin
                { After the second operand of MOV, or after the third
                  operand of anything but the long multiplies, a shifter
                  operand is expected.
                  NOTE(review): other opcodes with four plain register
                  operands would need to be excluded here as well -
                  confirm against the opcode table. }
                if ((instr.opcode=A_MOV) and (operandnum=2)) or
                   ((operandnum=3) and not(instr.opcode in [A_UMLAL,A_UMULL,A_SMLAL,A_SMULL])) then
                  begin
                    Consume(AS_COMMA);
                    { the shifter operand becomes the next operand; using a
                      fixed slot would leave a gap for the MOV case, where
                      only three operands are counted }
                    if not(TryBuildShifterOp(instr.Operands[operandnum+1] as tarmoperand)) then
                      Message(asmr_e_illegal_shifterop_syntax);
                    Inc(operandnum);
                  end
                else
                  begin
                    if operandnum>Max_Operands then
                      Message(asmr_e_too_many_operands)
                    else
                      Inc(operandnum);
                    Consume(AS_COMMA);
                  end;
              end;
            AS_SEPARATOR,
            AS_END : { End of asm operands for this opcode  }
              begin
                break;
              end;
            else
              BuildOperand(instr.Operands[operandnum] as tarmoperand);
          end; { end case }
        until false;
        instr.Ops:=operandnum;
      end;


    { Checks whether s has the form <opcode>[<condition>][<postfix>].
      On success actopcode, actcondition, actoppostfix and actasmtoken are
      set and true is returned. s is compared against upper case tables, so
      it is expected to be upper case. }
    function tarmattreader.is_asmopcode(const s: string):boolean;

      const
        { sorted by length so longer postfixes will match first }
        postfix2strsorted : array[1..19] of string[2] = (
          'EP','SB','BT','SH',
          'IA','IB','DA','DB','FD','FA','ED','EA',
          'B','D','E','P','T','H','S');

        postfixsorted : array[1..19] of TOpPostfix = (
          PF_EP,PF_SB,PF_BT,PF_SH,
          PF_IA,PF_IB,PF_DA,PF_DB,PF_FD,PF_FA,PF_ED,PF_EA,
          PF_B,PF_D,PF_E,PF_P,PF_T,PF_H,PF_S);

      var
        str2opentry: tstr2opentry;
        j : longint;
        hs : string;
        icond : tasmcond;
      Begin
        { making s a value parameter would break other assembler readers }
        hs:=s;
        is_asmopcode:=false;

        { clear op code, condition and postfix; without resetting the
          postfix, one picked up from a rejected identifier would be
          attached to the next opcode }
        actopcode:=A_None;
        actcondition:=C_None;
        actoppostfix:=PF_None;

        { first, handle B else BLS is read wrong;
          the length is tested first so hs[1] is never read on an empty
          string }
        if (length(hs)=3) and (hs[1]='B') then
          begin
            for icond:=low(tasmcond) to high(tasmcond) do
              begin
                if copy(hs,2,2)=uppercond2str[icond] then
                  begin
                    actopcode:=A_B;
                    actasmtoken:=AS_OPCODE;
                    actcondition:=icond;
                    is_asmopcode:=true;
                    exit;
                  end;
              end;
          end;

        { look for the longest prefix of hs which is a known opcode }
        str2opentry:=nil;
        for j:=length(hs) downto 1 do
          begin
            str2opentry:=tstr2opentry(iasmops.search(copy(hs,1,j)));
            if assigned(str2opentry) then
              begin
                actopcode:=str2opentry.op;
                actasmtoken:=AS_OPCODE;
                { strip op code }
                delete(hs,1,j);
                break;
              end;
          end;
        if not(assigned(str2opentry)) then
          exit;

        { search for condition, conditions are always 2 chars }
        if length(hs)>1 then
          begin
            for icond:=low(tasmcond) to high(tasmcond) do
              begin
                if copy(hs,1,2)=uppercond2str[icond] then
                  begin
                    actcondition:=icond;
                    { strip condition }
                    delete(hs,1,2);
                    break;
                  end;
              end;
          end;

        { check for postfix }
        if length(hs)>0 then
          begin
            for j:=low(postfixsorted) to high(postfixsorted) do
              begin
                if copy(hs,1,length(postfix2strsorted[j]))=postfix2strsorted[j] then
                  begin
                    actoppostfix:=postfixsorted[j];
                    { strip postfix }
                    delete(hs,1,length(postfix2strsorted[j]));
                    break;
                  end;
              end;
          end;

        { if we stripped all postfixes, it's a valid opcode }
        is_asmopcode:=length(hs)=0;
      end;


    { Turns a reference in the first operand of a call/jump into a plain
      symbol operand (symbol plus offset). A reference using a base or
      index register is reported as syntax error. }
    procedure tarmattreader.ConvertCalljmp(instr : tarminstruction);
      var
        newopr : toprrec;
      begin
        if instr.Operands[1].opr.typ=OPR_REFERENCE then
          begin
            { start from a zeroed record so the fields not assigned below
              do not carry stack garbage into the operand }
            fillchar(newopr,sizeof(newopr),0);
            newopr.typ:=OPR_SYMBOL;
            newopr.symbol:=instr.Operands[1].opr.ref.symbol;
            newopr.symofs:=instr.Operands[1].opr.ref.offset;
            if (instr.Operands[1].opr.ref.base<>NR_NO) or
               (instr.Operands[1].opr.ref.index<>NR_NO) then
              Message(asmr_e_syn_operand);
            instr.Operands[1].opr:=newopr;
          end;
      end;


    { Parses one instruction, appends it to curlist and resets the
      postfix state for the next opcode. }
    procedure tarmattreader.handleopcode;
      var
        instr : tarminstruction;
      begin
        instr:=TarmInstruction.Create(TarmOperand);
        BuildOpcode(instr);
        if is_calljmp(instr.opcode) then
          ConvertCalljmp(instr);
        {
        instr.AddReferenceSizes;
        instr.SetInstructionOpsize;
        instr.CheckOperandSizes;
        }
        instr.ConcatInstruction(curlist);
        instr.Free;
        actoppostfix:=PF_None;
      end;


{*****************************************************************************
                                     Initialize
*****************************************************************************}

const
  { the same reader class is registered for the GAS and the standard
    assembler mode }
  asmmode_arm_att_info : tasmmodeinfo =
          (
            id    : asmmode_arm_gas;
            idtxt : 'GAS';
            casmreader : tarmattreader;
          );

  asmmode_arm_standard_info : tasmmodeinfo =
          (
            id    : asmmode_standard;
            idtxt : 'STANDARD';
            casmreader : tarmattreader;
          );

initialization
  RegisterAsmMode(asmmode_arm_att_info);
  RegisterAsmMode(asmmode_arm_standard_info);
end.