mirror of
				https://gitlab.com/freepascal.org/fpc/source.git
				synced 2025-10-26 02:01:34 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			497 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
			
		
		
	
	
			497 lines
		
	
	
		
			10 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| {
 | |
|     This file is part of the Free Component Library (FCL)
 | |
|     Copyright (c) 1999-2007 by the Free Pascal development team
 | |
| 
 | |
|     See the file COPYING.FPC, included in this distribution,
 | |
|     for details about the copyright.
 | |
| 
 | |
|     This program is distributed in the hope that it will be useful,
 | |
|     but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 | |
| 
 | |
|  **********************************************************************}
 | |
| 
 | |
| {****************************************************************************}
 | |
| {*                             TParser                                      *}
 | |
| {****************************************************************************}
 | |
| 
 | |
| const
 | |
|   ParseBufSize     = 4096;
 | |
|   LastSpecialToken = 5;
 | |
| 
 | |
|   TokNames : array[0..LastSpecialToken] of string =
 | |
|   (
 | |
|     'EOF',
 | |
|     'Symbol',
 | |
|     'String',
 | |
|     'Integer',
 | |
|     'Float',
 | |
|     'WideString'
 | |
|   );
 | |
| 
 | |
| function TParser.GetTokenName(aTok: char): string;
 | |
| begin
 | |
|   if ord(aTok) <= LastSpecialToken then
 | |
|     Result:=TokNames[ord(aTok)]
 | |
|   else Result:=aTok;
 | |
| end;
 | |
| 
 | |
| procedure TParser.LoadBuffer;
 | |
| var
 | |
|   BytesRead: integer;
 | |
| begin
 | |
|   BytesRead := FStream.Read(FBuf^, ParseBufSize);
 | |
|   if BytesRead = 0 then
 | |
|   begin
 | |
|     FEofReached := True;
 | |
|     Exit;
 | |
|   end;
 | |
|   FBuf[BytesRead] := #0;
 | |
|   Inc(FDeltaPos, BytesRead);
 | |
|   FPos := 0;
 | |
|   FBufLen := BytesRead;
 | |
| end;
 | |
| 
 | |
| procedure TParser.CheckLoadBuffer; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   if fBuf[fPos]=#0 then LoadBuffer;
 | |
| end;
 | |
| 
 | |
| procedure TParser.ProcessChar; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   fLastTokenStr:=fLastTokenStr+fBuf[fPos];
 | |
|   inc(fPos);
 | |
|   CheckLoadBuffer;
 | |
| end;
 | |
| 
 | |
| function TParser.IsNumber: boolean; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   Result:=fBuf[fPos] in ['0'..'9'];
 | |
| end;
 | |
| 
 | |
| function TParser.IsHexNum: boolean; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   Result:=fBuf[fPos] in ['0'..'9','A'..'F','a'..'f'];
 | |
| end;
 | |
| 
 | |
| function TParser.IsAlpha: boolean; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   Result:=fBuf[fPos] in ['_','A'..'Z','a'..'z'];
 | |
| end;
 | |
| 
 | |
| function TParser.IsAlphaNum: boolean; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   Result:=IsAlpha or IsNumber;
 | |
| end;
 | |
| 
 | |
| function TParser.GetHexValue(c: char): byte; {$ifdef CLASSESINLINE} inline; {$endif CLASSESINLINE}
 | |
| begin
 | |
|   case c of
 | |
|     '0'..'9' : Result:=ord(c)-$30;
 | |
|     'A'..'F' : Result:=ord(c)-$37; //-$41+$0A
 | |
|     'a'..'f' : Result:=ord(c)-$57; //-$61+$0A
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| function TParser.GetAlphaNum: string;
 | |
| begin
 | |
|   if not IsAlpha then
 | |
|     ErrorFmt(SParExpected,[GetTokenName(toSymbol)]);
 | |
|   Result:='';
 | |
|   while IsAlphaNum do
 | |
|   begin
 | |
|     Result:=Result+fBuf[fPos];
 | |
|     inc(fPos);
 | |
|     CheckLoadBuffer;
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleNewLine;
 | |
| begin
 | |
|   if fBuf[fPos]=#13 then //CR
 | |
|   begin
 | |
|     inc(fPos);
 | |
|     CheckLoadBuffer;
 | |
|     if fBuf[fPos]=#10 then inc(fPos); //CR LF
 | |
|   end
 | |
|   else inc(fPos); //LF
 | |
|   inc(fSourceLine);
 | |
|   fDeltaPos:=-(fPos-1);
 | |
| end;
 | |
| 
 | |
| procedure TParser.SkipBOM;
 | |
| var
 | |
|   i : integer;
 | |
|   bom : string[3];
 | |
|   backup : integer;
 | |
| begin
 | |
|   i:=1;
 | |
|   bom:='   ';
 | |
|   backup:=fPos;
 | |
|   while (fBuf[fPos] in [#$BB,#$BF,#$EF]) and (i<=3) do
 | |
|   begin
 | |
|     bom[i]:=fBuf[fPos];
 | |
|     inc(fPos);
 | |
|     inc(i);
 | |
|   end;
 | |
|   if (bom<>(#$EF+#$BB+#$BF)) then
 | |
|     fPos:=backup;
 | |
| end;
 | |
| 
 | |
| procedure TParser.SkipSpaces;
 | |
| begin
 | |
|   while fBuf[fPos] in [' ',#9] do
 | |
|     inc(fPos);
 | |
| end;
 | |
| 
 | |
| procedure TParser.SkipWhitespace;
 | |
| begin
 | |
|   while true do
 | |
|   begin
 | |
|     CheckLoadBuffer;
 | |
|     case fBuf[fPos] of
 | |
|       ' ',#9  : SkipSpaces;
 | |
|       #10,#13 : HandleNewLine
 | |
|       else break;
 | |
|     end;
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleEof;
 | |
| begin
 | |
|   fToken:=toEOF;
 | |
|   fLastTokenStr:='';
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleAlphaNum;
 | |
| begin
 | |
|   fLastTokenStr:=GetAlphaNum;
 | |
|   fToken:=toSymbol;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleNumber;
 | |
| type
 | |
|   floatPunct = (fpDot,fpE);
 | |
|   floatPuncts = set of floatPunct;
 | |
| var
 | |
|   allowed : floatPuncts;
 | |
| begin
 | |
|   fLastTokenStr:='';
 | |
|   while IsNumber do
 | |
|     ProcessChar;
 | |
|   fToken:=toInteger;
 | |
|   if (fBuf[fPos] in ['.','e','E']) then
 | |
|   begin
 | |
|     fToken:=toFloat;
 | |
|     allowed:=[fpDot,fpE];
 | |
|     while (fBuf[fPos] in ['.','e','E','0'..'9']) do
 | |
|     begin
 | |
|       case fBuf[fPos] of
 | |
|         '.'     : if fpDot in allowed then Exclude(allowed,fpDot) else break;
 | |
|         'E','e' : if fpE in allowed then
 | |
|                   begin
 | |
|                     allowed:=[];
 | |
|                     ProcessChar;
 | |
|                     if (fBuf[fPos] in ['+','-']) then ProcessChar;
 | |
|                     if not (fBuf[fPos] in ['0'..'9']) then
 | |
|                       ErrorFmt(SParInvalidFloat,[fLastTokenStr+fBuf[fPos]]);
 | |
|                   end
 | |
|                   else break;
 | |
|       end;
 | |
|       ProcessChar;
 | |
|     end;
 | |
|   end;
 | |
|   if (fBuf[fPos] in ['s','S','d','D','c','C']) then //single, date, currency
 | |
|   begin
 | |
|     fFloatType:=fBuf[fPos];
 | |
|     inc(fPos);
 | |
|     fToken:=toFloat;
 | |
|   end
 | |
|   else fFloatType:=#0;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleHexNumber;
 | |
| var valid : boolean;
 | |
| begin
 | |
|   fLastTokenStr:='$';
 | |
|   inc(fPos);
 | |
|   CheckLoadBuffer;
 | |
|   valid:=false;
 | |
|   while IsHexNum do
 | |
|   begin
 | |
|     valid:=true;
 | |
|     ProcessChar;
 | |
|   end;
 | |
|   if not valid then
 | |
|     ErrorFmt(SParInvalidInteger,[fLastTokenStr]);
 | |
|   fToken:=toInteger;
 | |
| end;
 | |
| 
 | |
| function TParser.HandleQuotedString: string;
 | |
| begin
 | |
|   Result:='';
 | |
|   inc(fPos);
 | |
|   CheckLoadBuffer;
 | |
|   while true do
 | |
|   begin
 | |
|     case fBuf[fPos] of
 | |
|       #0     : ErrorStr(SParUnterminatedString);
 | |
|       #13,#10 : ErrorStr(SParUnterminatedString);
 | |
|       ''''   : begin
 | |
|                  inc(fPos);
 | |
|                  CheckLoadBuffer;
 | |
|                  if fBuf[fPos]<>'''' then exit;
 | |
|                end;
 | |
|     end;
 | |
|     Result:=Result+fBuf[fPos];
 | |
|     inc(fPos);
 | |
|     CheckLoadBuffer;
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleDecimalCharacter(var ascii: boolean; out
 | |
|   WideChr: widechar; out StringChr: char);
 | |
| var i : integer;
 | |
| begin
 | |
|   inc(fPos);
 | |
|   CheckLoadBuffer;
 | |
|   // read a word number
 | |
|   i:=0;
 | |
|   while IsNumber and (i<high(word)) do
 | |
|   begin
 | |
|     i:=i*10+ord(fBuf[fPos])-ord('0');
 | |
|     inc(fPos);
 | |
|     CheckLoadBuffer;
 | |
|   end;
 | |
|   if i>high(word) then i:=0;
 | |
|   if i>127 then ascii:=false;
 | |
|   WideChr:=widechar(word(i));
 | |
|   if i<256 then
 | |
|     StringChr:=chr(i)
 | |
|   else
 | |
|     StringChr:=#0;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleString;
 | |
| var ascii : boolean;
 | |
|   s: string;
 | |
|   w: WideChar;
 | |
|   c: char;
 | |
| begin
 | |
|   fLastTokenWStr:='';
 | |
|   fLastTokenStr:='';
 | |
|   ascii:=true;
 | |
|   while true do
 | |
|   begin
 | |
|     case fBuf[fPos] of
 | |
|       '''' :
 | |
|         begin
 | |
|           // avoid conversions,
 | |
|           // On some systems conversion from ansistring to widestring and back
 | |
|           // to ansistring does not give the original ansistring.
 | |
|           // See bug http://bugs.freepascal.org/view.php?id=15841
 | |
|           s:=HandleQuotedString;
 | |
|           fLastTokenWStr:=fLastTokenWStr+s;
 | |
|           fLastTokenStr:=fLastTokenStr+s;
 | |
|         end;
 | |
|       '#'  :
 | |
|         begin
 | |
|           HandleDecimalCharacter(ascii,w,c);
 | |
|           fLastTokenWStr:=fLastTokenWStr+w;
 | |
|           fLastTokenStr:=fLastTokenStr+c;
 | |
|         end;
 | |
|       else break;
 | |
|     end;
 | |
|   end;
 | |
|   if ascii then
 | |
|     fToken:=Classes.toString
 | |
|   else
 | |
|     fToken:=toWString;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleMinus;
 | |
| begin
 | |
|   inc(fPos);
 | |
|   CheckLoadBuffer;
 | |
|   if IsNumber then
 | |
|   begin
 | |
|     HandleNumber;
 | |
|     fLastTokenStr:='-'+fLastTokenStr;
 | |
|   end
 | |
|   else
 | |
|   begin
 | |
|     fToken:='-';
 | |
|     fLastTokenStr:=fToken;
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| procedure TParser.HandleUnknown;
 | |
| begin
 | |
|   fToken:=fBuf[fPos];
 | |
|   fLastTokenStr:=fToken;
 | |
|   inc(fPos);
 | |
| end;
 | |
| 
 | |
| constructor TParser.Create(Stream: TStream);
 | |
| begin
 | |
|   fStream:=Stream;
 | |
|   fBuf:=GetMem(ParseBufSize+1);
 | |
|   fBufLen:=0;
 | |
|   fPos:=0;
 | |
|   fDeltaPos:=1;
 | |
|   fSourceLine:=1;
 | |
|   fEofReached:=false;
 | |
|   fLastTokenStr:='';
 | |
|   fLastTokenWStr:='';
 | |
|   fFloatType:=#0;
 | |
|   fToken:=#0;
 | |
|   LoadBuffer;
 | |
|   SkipBom;
 | |
|   NextToken;
 | |
| end;
 | |
| 
 | |
| destructor TParser.Destroy;
 | |
| begin
 | |
|   fStream.Position:=SourcePos;
 | |
|   FreeMem(fBuf);
 | |
| end;
 | |
| 
 | |
| procedure TParser.CheckToken(T: Char);
 | |
| begin
 | |
|   if fToken<>T then
 | |
|     ErrorFmt(SParWrongTokenType,[GetTokenName(T),GetTokenName(fToken)]);
 | |
| end;
 | |
| 
 | |
| procedure TParser.CheckTokenSymbol(const S: string);
 | |
| begin
 | |
|   CheckToken(toSymbol);
 | |
|   if CompareText(fLastTokenStr,S)<>0 then
 | |
|     ErrorFmt(SParWrongTokenSymbol,[s,fLastTokenStr]);
 | |
| end;
 | |
| 
 | |
| procedure TParser.Error(const Ident: string);
 | |
| begin
 | |
|   ErrorStr(Ident);
 | |
| end;
 | |
| 
 | |
| procedure TParser.ErrorFmt(const Ident: string; const Args: array of const);
 | |
| begin
 | |
|   ErrorStr(Format(Ident,Args));
 | |
| end;
 | |
| 
 | |
| procedure TParser.ErrorStr(const Message: string);
 | |
| begin
 | |
|   raise EParserError.CreateFmt(Message+SParLocInfo,[SourceLine,fPos+fDeltaPos,SourcePos]);
 | |
| end;
 | |
| 
 | |
| procedure TParser.HexToBinary(Stream: TStream);
 | |
| var outbuf : array[0..ParseBufSize-1] of byte;
 | |
|     b : byte;
 | |
|     i : integer;
 | |
| begin
 | |
|   i:=0;
 | |
|   SkipWhitespace;
 | |
|   while IsHexNum do
 | |
|   begin
 | |
|     b:=(GetHexValue(fBuf[fPos]) shl 4);
 | |
|     inc(fPos);
 | |
|     CheckLoadBuffer;
 | |
|     if not IsHexNum then
 | |
|       Error(SParUnterminatedBinValue);
 | |
|     b:=b or GetHexValue(fBuf[fPos]);
 | |
|     inc(fPos);
 | |
|     outbuf[i]:=b;
 | |
|     inc(i);
 | |
|     if i>=ParseBufSize then
 | |
|     begin
 | |
|       Stream.WriteBuffer(outbuf[0],i);
 | |
|       i:=0;
 | |
|     end;
 | |
|     SkipWhitespace;
 | |
|   end;
 | |
|   if i>0 then
 | |
|     Stream.WriteBuffer(outbuf[0],i);
 | |
|   NextToken;
 | |
| end;
 | |
| 
 | |
| function TParser.NextToken: Char;
 | |
| 
 | |
| begin
 | |
|   SkipWhiteSpace;
 | |
|   if fEofReached then
 | |
|     HandleEof
 | |
|   else
 | |
|     case fBuf[fPos] of
 | |
|       '_','A'..'Z','a'..'z' : HandleAlphaNum;
 | |
|       '$'                   : HandleHexNumber;
 | |
|       '-'                   : HandleMinus;
 | |
|       '0'..'9'              : HandleNumber;
 | |
|       '''','#'              : HandleString
 | |
|       else
 | |
|         HandleUnknown;
 | |
|     end;
 | |
|   Result:=fToken;
 | |
| end;
 | |
| 
 | |
| function TParser.SourcePos: Longint;
 | |
| begin
 | |
|   Result:=fStream.Position-fBufLen+fPos;
 | |
| end;
 | |
| 
 | |
| function TParser.TokenComponentIdent: string;
 | |
| begin
 | |
|   if fToken<>toSymbol then
 | |
|     ErrorFmt(SParExpected,[GetTokenName(toSymbol)]);
 | |
|   CheckLoadBuffer;
 | |
|   while fBuf[fPos]='.' do
 | |
|   begin
 | |
|     ProcessChar;
 | |
|     fLastTokenStr:=fLastTokenStr+GetAlphaNum;
 | |
|   end;
 | |
|   Result:=fLastTokenStr;
 | |
| end;
 | |
| 
 | |
| {$ifndef FPUNONE}
 | |
| Function TParser.TokenFloat: Extended;
 | |
| 
 | |
| var errcode : word;
 | |
| 
 | |
| begin
 | |
|   Val(fLastTokenStr,Result,errcode);
 | |
|   if errcode<>0 then
 | |
|     ErrorFmt(SParInvalidFloat,[fLastTokenStr]);
 | |
| end;
 | |
| {$endif}
 | |
| 
 | |
| Function TParser.TokenInt: Int64;
 | |
| begin
 | |
|   if not TryStrToInt64(fLastTokenStr,Result) then
 | |
|     Result:=Int64(StrToQWord(fLastTokenStr)); //second chance for malformed files
 | |
| end;
 | |
| 
 | |
| function TParser.TokenString: string;
 | |
| begin
 | |
|   case fToken of
 | |
|     toWString : Result:=fLastTokenWStr;
 | |
|     toFloat : if fFloatType<>#0 then
 | |
|                 Result:=fLastTokenStr+fFloatType
 | |
|               else Result:=fLastTokenStr
 | |
|     else
 | |
|       Result:=fLastTokenStr;
 | |
|   end;
 | |
| end;
 | |
| 
 | |
| function TParser.TokenWideString: WideString;
 | |
| begin
 | |
|   if fToken=toWString then
 | |
|     Result:=fLastTokenWStr
 | |
|   else
 | |
|     Result:=fLastTokenStr;
 | |
| end;
 | |
| 
 | |
| function TParser.TokenSymbolIs(const S: string): Boolean;
 | |
| begin
 | |
|   Result:=(fToken=toSymbol) and (CompareText(fLastTokenStr,S)=0);
 | |
| end;
 | |
| 
 | 
