codetools: parse multiline string constant

This commit is contained in:
mattias 2022-03-14 16:37:55 +01:00
parent 89a9d84d34
commit e2ad6b3d8d
8 changed files with 287 additions and 46 deletions

View File

@ -0,0 +1,5 @@
<?xml version="1.0" encoding="UTF-8"?>
<CONFIG>
<Makefile Value="2"/>
<Params Value=" -Fu../../packager/units/$(CPU_TARGET)-$(OS_TARGET);../lazutils/lib/$(CPU_TARGET)-$(OS_TARGET);../freetype/lib/$(CPU_TARGET)-$(OS_TARGET);../../lcl/units/$(CPU_TARGET)-$(OS_TARGET);../../lcl/units/$(CPU_TARGET)-$(OS_TARGET)/$(LCL_PLATFORM);. -MObjFPC -Scghi -O1 -g -gl -l -vewnhibq -dLCL -dLCL$(LCL_PLATFORM) anchordockpkg.pas"/>
</CONFIG>

View File

@ -0,0 +1,5 @@
<?xml version="1.0" encoding="UTF-8"?>
<CONFIG>
<Makefile Value="2"/>
<Params Value=" -Fu../../../packager/units/$(CPU_TARGET)-$(OS_TARGET);../../lazutils/lib/$(CPU_TARGET)-$(OS_TARGET);../../buildintf/units/$(CPU_TARGET)-$(OS_TARGET);../../freetype/lib/$(CPU_TARGET)-$(OS_TARGET);../../../lcl/units/$(CPU_TARGET)-$(OS_TARGET);../../../lcl/units/$(CPU_TARGET)-$(OS_TARGET)/$(LCL_PLATFORM);../units/$(CPU_TARGET)-$(OS_TARGET)/$(LCL_PLATFORM);../../lazcontrols/lib/$(CPU_TARGET)-$(OS_TARGET)/$(LCL_PLATFORM);../../ideintf/units/$(CPU_TARGET)-$(OS_TARGET)/$(LCL_PLATFORM);. -MObjFPC -Scghi -O1 -g -gl -l -vewnhibq -dLCL -dLCL$(LCL_PLATFORM) anchordockingdsgn.pas"/>
</CONFIG>

View File

@ -1409,7 +1409,17 @@ begin
begin
inc(Result);
while (Result<=MaxPos) do begin
if (ASource[Result] in ['''',#10,#13]) then
if (ASource[Result] in ['''',#0,#10,#13]) then
break;
inc(Result);
end;
end;
'`':
begin
inc(Result);
while (Result<=MaxPos) do begin
if (ASource[Result] in ['`',#0]) then
break;
inc(Result);
end;
@ -1493,11 +1503,16 @@ begin
begin
inc(Result);
while (Result<=MaxPos) do begin
if (ASource[Result]<>'''') then
inc(Result)
else begin
inc(Result);
case ASource[Result] of
'''':
begin
inc(Result);
break;
end;
#0,#10,#13:
break;
else
inc(Result);
end;
end;
end;
@ -2106,7 +2121,7 @@ begin
inc(Src);
end;
end;
'''','#': // string constant
'''','#','`': // string constant
begin
while true do begin
case Src^ of
@ -2124,11 +2139,19 @@ begin
'''':
begin
inc(Src);
while not (Src^ in ['''',#0]) do
while not (Src^ in ['''',#0,#10,#13]) do
inc(Src);
if Src^='''' then
inc(Src);
end;
'`':
begin
inc(Src);
while not (Src^ in ['`',#0]) do
inc(Src);
if Src^='`' then
inc(Src);
end;
else
break;
end;
@ -2245,6 +2268,13 @@ var
dec(Position);
until (Position<1) or (Source[Position] in [#0,#10,#13,'''']);
end;
'`':
begin
dec(Position);
repeat
dec(Position);
until (Position<1) or (Source[Position] in [#0,'`']);
end;
'0'..'9','A'..'Z','a'..'z':
begin
// test if char constant
@ -2356,6 +2386,18 @@ var
if IsStringConstant then break;
end;
'`':
begin
// a multiline string constant -> skip it
OldPrePos:=PrePos;
while (PrePos<Position) do begin
inc(PrePos);
if Source[PrePos]='`' then
break;
end;
if IsStringConstant then break;
end;
#10,#13:
// no comment and no string constant found
break;
@ -2445,7 +2487,7 @@ begin
// read atom
if IsStringConstant then begin
Position:=OldPrePos;
if (Position>1) and (Source[Position-1]='''') then begin
if (Position>1) and (Source[Position-1] in ['''','`']) then begin
ReadStringConstantBackward;
end;
exit;
@ -2473,7 +2515,7 @@ begin
end;
end;
end;
'''':
'''','`':
begin
inc(Position);
ReadStringConstantBackward;
@ -2683,7 +2725,7 @@ begin
inc(p);
end;
end;
'''','#': // string constant
'''','#','`': // string constant
begin
while true do begin
case p^ of
@ -2696,7 +2738,14 @@ begin
'''':
begin
inc(p);
while not (p^ in ['''',#10,#13]) do
while not (p^ in ['''',#0,#10,#13]) do
inc(p);
inc(p);
end;
'`':
begin
inc(p);
while not (p^ in ['`',#0]) do
inc(p);
inc(p);
end;
@ -2819,6 +2868,20 @@ function FindStartOfAtom(const Source: string; Position: integer): integer;
until (Source[PrePos]='''');
p:=PrePos;
end;
'`':
begin
PrePos:=p;
dec(PrePos);
repeat
dec(PrePos);
if (PrePos<1) then begin
// the StartPos was the start of a string constant
p:=StartPos-1;
exit;
end;
until (Source[PrePos]='`');
p:=PrePos;
end;
'0'..'9','A'..'Z','a'..'z':
begin
// test if char constant
@ -2887,7 +2950,7 @@ begin
end;
end;
end;
'''':
'''','`':
begin
// could be start or end
inc(Result);
@ -4078,6 +4141,19 @@ begin
end;
end;
'`':
begin
inc(Result);
while (Result<=MaxPos) do begin
if (ASource[Result]<>'`') then
inc(Result)
else begin
inc(Result);
break;
end;
end;
end;
'/':
begin
inc(Result);
@ -4123,7 +4199,7 @@ var
l: Integer;
p: PChar;
begin
SetLength(Result,length(Src));
SetLength(Result{%H-},length(Src));
SrcPos:=1;
ResultPos:=1;
while SrcPos<=length(Src) do begin
@ -4453,7 +4529,7 @@ begin
end;
case p1^ of
'''':
'''','`':
// compare string constants case sensitive
exit(CompareStringConstants(p1,p2));
'{':
@ -4495,9 +4571,13 @@ end;
function CompareStringConstants(p1, p2: PChar): integer;
// 1: 'aa' 'ab' because bigger
// 1: 'aa' 'a' because longer
var
s1, s2: Char;
begin
Result := 0;
if (p1^='''') and (p2^='''') then begin
s1:=p1^;
s2:=p2^;
if (s1 in ['''','`']) and (s2 in ['''','`']) then begin
inc(p1);
inc(p2);
repeat
@ -4507,19 +4587,19 @@ begin
exit(-1); // p2 bigger
inc(p1);
inc(p2);
if p1^='''' then begin
// maybe ''
if p1^=s1 then begin
// maybe '' or ``
inc(p1);
inc(p2);
if p1^='''' then begin
if p2^='''' then begin
if p1^=s1 then begin
if p2^=s2 then begin
inc(p1);
inc(p2);
end else begin
// p1 is longer (e.g.: 'a''b' 'a')
exit(1);
end;
end else if p2^='''' then begin
end else if p2^=s2 then begin
// p2 is longer (e.g. 'a' 'a''b')
exit(-1);
end else begin
@ -4527,25 +4607,28 @@ begin
exit(0);
end;
end;
if p1^ in [#0,#10,#13] then begin
if ((s1='''') and (p1^ in [#0,#10,#13]))
or ((s1='`') and (p1^=#0)) then begin
// end of p1 found
if p2^ in [#0,#10,#13] then begin
if ((s2='''') and (p2^ in [#0,#10,#13]))
or ((s2='`') and (p2^=#0)) then begin
// same
exit(0);
end else begin
// p2 is longer
exit(-1);
end;
end else if p2^ in [#0,#10,#13] then begin
end else if ((s2='''') and (p2^ in [#0,#10,#13]))
or ((s2='`') and (p2^=#0)) then begin
// p1 is longer
exit(1);
end;
until false;
end else begin
if p1^='''' then
if p1^=s1 then
// p1 longer
exit(1)
else if p2^='''' then
else if p2^=s2 then
// p2 longer
exit(-1)
else
@ -4748,11 +4831,21 @@ begin
while (Result<=MaxPos) do begin
c:=Source[Result];
if IsIdentStartChar[c] then exit;
if c='''' then begin
// skip string constant
inc(Result);
while (Result<=MaxPos) and (not (Source[Result] in ['''',#10,#13])) do
case c of
'''':
begin
// skip string constant
inc(Result);
while (Result<=MaxPos) and (not (Source[Result] in ['''',#10,#13])) do
inc(Result);
end;
'`':
begin
// skip multiline string constant
inc(Result);
while (Result<=MaxPos) and (Source[Result]<>'`') do
inc(Result);
end;
end;
inc(Result);
end;
@ -4917,7 +5010,7 @@ var
i: Integer;
begin
if TabWidth<=0 then begin
SetLength(Result,Indent);
SetLength(Result{%H-},Indent);
if Indent>0 then
FillChar(Result[1],length(Result),' ');
end else begin
@ -5101,7 +5194,7 @@ var
l: Integer;
begin
l:=DottedIdentifierLength(Identifier);
SetLength(Result,l);
SetLength(Result{%H-},l);
if l>0 then
System.Move(Identifier^,Result[1],l);
end;
@ -5182,7 +5275,7 @@ var CodePos, ResultPos, CodeLen, SpaceEndPos: integer;
c1, c2: char;
begin
CodeLen:=length(ACode);
SetLength(Result,CodeLen);
SetLength(Result{%H-},CodeLen);
CodePos:=1;
ResultPos:=1;
while CodePos<=CodeLen do begin

View File

@ -2044,7 +2044,7 @@ begin
// first read and compute needed length
ReadIt;
// allocate space and copy tokens
SetLength(s,p-1);
SetLength(s{%H-},p-1);
ReadIt;
Result:=s;
end;

View File

@ -881,7 +881,7 @@ var
begin
if (CurPos.StartPos<1) or (CurPos.StartPos>SrcLen) then exit(false);
p:=@Src[CurPos.StartPos];
Result:=(p^ in ['''','#']) or ((p^='^') and (p[1] in ['A'..'Z']));
Result:=(p^ in ['''','#','`']) or ((p^='^') and (p[1] in ['A'..'Z']));
end;
function TCustomCodeTool.AtomIsCharConstant: boolean;
@ -922,6 +922,20 @@ begin
end;
end;
'`':
begin
inc(p);
if p^='`' then begin
// could be ````
if (p[1]<>'`') or (p[2]<>'`') then exit;
inc(p,3);
end else begin
// could be `a`
if p[1]<>'`' then exit;
inc(p,2);
end;
end;
'^':
begin
if not (p[1] in ['A'..'Z']) then exit;
@ -930,18 +944,25 @@ begin
end;
// check that no second character is following
Result:=not (p^ in ['''','#','^']);
Result:=not (p^ in ['''','`','#','^']);
end;
end;
function TCustomCodeTool.AtomIsEmptyStringConstant: boolean;
var
p: LongInt;
c: Char;
begin
p:=CurPos.StartPos;
while (p<=SrcLen) and (Src[p]='''') do inc(p);
dec(p,CurPos.StartPos);
Result:=(p>0) and ((p and 1)=0);
if (p>SrcLen) then exit(false);
c:=Src[p];
if not (c in ['''','`']) then exit(false);
inc(p);
if (p>SrcLen) then exit(true);
if Src[p]<>c then exit(false);
inc(p);
if (p>SrcLen) then exit(true);
if Src[p] in ['''','`','#'] then exit(false);
end;
function TCustomCodeTool.LastAtomIs(BackIndex: integer;
@ -1181,7 +1202,7 @@ begin
CurPos.Flag:=cafEnd;
end;
end;
'''','#':
'''','#','`':
begin
// string constant
while true do begin
@ -1218,6 +1239,23 @@ begin
end;
end;
end;
'`':
begin
inc(p);
while true do begin
case p^ of
'`':
begin
inc(p);
break;
end;
#0:
break;
else
inc(p);
end;
end;
end;
'^':
begin
inc(p);
@ -1404,6 +1442,13 @@ var
dec(CurPos.StartPos);
until (CurPos.StartPos<1) or (Src[CurPos.StartPos] in [#0,#10,#13,'''']);
end;
'`':
begin
dec(CurPos.StartPos);
repeat
dec(CurPos.StartPos);
until (CurPos.StartPos<1) or (Src[CurPos.StartPos] in [#0,'`']);
end;
'0'..'9','A'..'Z','a'..'z':
begin
// test if char constant
@ -1515,6 +1560,29 @@ var
if IsStringConstant then break;
end;
'`':
begin
// a multiline string constant -> skip it
OldPrePos:=PrePos;
while (PrePos<CurPos.StartPos) do begin
inc(PrePos);
case Src[PrePos] of
'`':
break;
#0:
begin
// string constant right border is the line end
// -> last atom of line found
IsStringConstant:=true;
break;
end;
end;
end;
if IsStringConstant then break;
end;
#10,#13:
// no comment and no string constant found
break;
@ -1610,7 +1678,7 @@ begin
// read atom
if IsStringConstant then begin
CurPos.StartPos:=OldPrePos;
if (CurPos.StartPos>1) and (Src[CurPos.StartPos-1]='''') then begin
if (CurPos.StartPos>1) and (Src[CurPos.StartPos-1] in ['''','`']) then begin
ReadStringConstantBackward;
end;
LastAtoms.AddReverse(CurPos);
@ -1649,7 +1717,7 @@ begin
end;
end;
end;
'''':
'''','`':
begin
inc(CurPos.StartPos);
ReadStringConstantBackward;
@ -1886,6 +1954,25 @@ begin
#0,#10,#13:
break;
else
inc(p);
end;
end;
end;
'`':
begin
inc(p);
while true do begin
case p^ of
'`':
begin
inc(p);
break;
end;
#0:
break;
else
inc(p);
end;
@ -3099,7 +3186,7 @@ begin
while (CleanStartPos<=SrcLen)
and (IsIdentChar[Src[CleanStartPos+len]]) do
inc(len);
SetLength(Result,len);
SetLength(Result{%H-},len);
if len>0 then
Move(Src[CleanStartPos],Result[1],len);
end else

View File

@ -2347,7 +2347,7 @@ begin
try
WritePascalToStream(ms);
SetLength(NewSrc,ms.Size);
SetLength(NewSrc{%H-},ms.Size);
if NewSrc<>'' then begin
ms.Position:=0;
ms.Read(NewSrc[1],length(NewSrc));

View File

@ -227,7 +227,8 @@ type
cmsExternalClass, { pas2js: allow class external [pkgname] name [symbol] }
cmsIgnoreAttributes, { pas2js: ignore attributes }
cmsOmitRTTI, { pas2js: treat class section 'published' as 'public' and typeinfo does not work on symbols declared with this switch }
cmsImplicitFunctionSpecialization { infer types on calls of generic functions }
cmsImplicitFunctionSpecialization, { infer types on calls of generic functions }
cmsMultiLineStrings { pas2js: Multiline strings }
);
TCompilerModeSwitches = set of TCompilerModeSwitch;
const
@ -318,7 +319,8 @@ const
'EXTERNALCLASS',
'IGNOREATTRIBUTES',
'OMITRTTI',
'IMPLICITFUNCTIONSPECIALIZATION'
'IMPLICITFUNCTIONSPECIALIZATION',
'MULTILINESTRINGS'
);
@ -1922,7 +1924,7 @@ begin
end;
SrcPos:=p-PChar(Src)+1;
end;
'''','#':
'''','#','`':
begin
TokenType:=lsttStringConstant;
while true do begin
@ -1962,6 +1964,27 @@ begin
end;
end;
end;
'`':
begin
inc(p);
while true do begin
case p^ of
#0:
begin
SrcPos:=p-PChar(Src)+1;
if SrcPos>SrcLen then break;
inc(p);
end;
'`':
begin
inc(p);
break;
end;
else
inc(p);
end;
end;
end;
else
break;
end;
@ -4590,6 +4613,14 @@ begin
if p^='''' then
inc(p);
end;
'`':
begin
// skip multiline string constant
inc(p);
while not (p^ in ['`',#0]) do inc(p);
if p^='`' then
inc(p);
end;
#0:
begin
// FPC allows that corresponding IFDEF and ENDIF are in different files

View File

@ -56,6 +56,7 @@ type
procedure TestParseProcAnoArg;
procedure TestParseProcAnoArgSubFunc;
procedure TestParseThreadVar;
procedure TestParseMultilineString;
end;
implementation
@ -614,6 +615,25 @@ begin
ParseModule;
end;
procedure TTestPascalParser.TestParseMultilineString;
begin
Add([
'program test1;',
'{$modeswitch multilinestrings}',
'const',
' s = `First',
'Second',
'Third`;',
' a = ``;',
' b = `',
'`#10`',
'line`;',
' c = ''''``;',
'begin',
'']);
ParseModule;
end;
initialization
RegisterTest(TTestPascalParser);