lazarus/components/lazutils/lookupstringlist.pas
2021-02-05 11:27:59 +00:00

174 lines
4.4 KiB
ObjectPascal

{
*****************************************************************************
This file is part of LazUtils.
See the file COPYING.modifiedLGPL.txt, included in this distribution,
for details about the license.
*****************************************************************************
Author: Juha Manninen / Antônio Galvão
Abstract:
This is an unsorted StringList with a fast lookup feature.
Internally it uses a map container to store the strings again
which is then used for Contains, IndexOf and Find methods.
The extra container does not reserve too much memory because the strings are
reference counted and not really copied.
All Duplicates property values are fully supported,
including dupIgnore and dupError, unlike in unsorted StringList.
This class is useful only when you must preserve the order in list, but
also need to do fast lookups to see if a string exists, or must prevent duplicates.
}
unit LookupStringList;
{$mode objfpc}{$H+}
interface
uses
Classes, SysUtils, AvgLvlTree;
type
{ TLookupStringList }
TLookupStringList = class(TStringList)
private
FMap: TStringMap;
protected
procedure InsertItem(Index: Integer; const S: string); override;
public
constructor Create(aCaseSensitive: Boolean);
constructor Create;
destructor Destroy; override;
procedure Assign(Source: TPersistent); override;
procedure Clear; override;
procedure Delete(Index: Integer); override;
function Add(const S: string): Integer; override;
function AddObject(const S: string; AObject: TObject): Integer; override;
function Contains(const S: string): Boolean; // A new function
function Find(const S: string; out Index: Integer): Boolean; override;
function IndexOf(const S: string): Integer; override;
end;
function Deduplicate(AStrings: TStrings): Integer;
implementation
function Deduplicate(AStrings: TStrings): Integer;
// Removes duplicate strings (case sensitive) from AStrings.
// Returns the number of duplicates removed.
var
DSL: TLookupStringList;
InCnt: Integer;
begin
InCnt := AStrings.Count;
DSL := TLookupStringList.Create(True);
try
DSL.Assign(AStrings);
AStrings.Assign(DSL);
Result := InCnt - AStrings.Count;
finally
DSL.Free;
end;
end;
{ TLookupStringList }
constructor TLookupStringList.Create(aCaseSensitive: Boolean);
begin
inherited Create;
CaseSensitive := aCaseSensitive;
FMap := TStringMap.Create(aCaseSensitive);
end;
constructor TLookupStringList.Create;
begin
Create(False); // Case-insensitive by default
end;
destructor TLookupStringList.Destroy;
begin
FMap.Free;
inherited Destroy;
end;
procedure TLookupStringList.Assign(Source: TPersistent);
begin
inherited Assign(Source);
if Source is TLookupStringList then
FMap.Assign(TLookupStringList(Source).FMap);
end;
procedure TLookupStringList.Clear;
begin
inherited Clear;
FMap.Clear;
end;
procedure TLookupStringList.Delete(Index: Integer);
var
s: String;
begin
s := Strings[Index];
inherited Delete(Index);
// The string must not be deleted from map if there are duplicates.
// Calling IndexOf is slow but it is needed.
if (Duplicates <> dupAccept) or (inherited IndexOf(s) = -1) then
FMap.Remove(s);
end;
function TLookupStringList.Add(const S: string): Integer;
begin
if not Sorted and (Duplicates = dupIgnore) and FMap.Contains(S) then
Result := -1
else
Result := inherited Add(S);
end;
function TLookupStringList.AddObject(const S: string; AObject: TObject): Integer;
begin
Result := Add(S);
if Result > -1 then
Objects[Result] := AObject;
end;
procedure TLookupStringList.InsertItem(Index: Integer; const S: string);
begin
if not Sorted and (Duplicates <> dupAccept) then
if FMap.Contains(S) then
case Duplicates of
DupIgnore : Exit;
DupError : raise Exception.Create('TLookupStringList.InsertItem:'
+' Duplicates are not allowed.');
end;
inherited InsertItem(Index, S);
FMap.Add(S); // Insert string to map, too.
end;
function TLookupStringList.Contains(const S: string): Boolean;
begin
Result := FMap.Contains(S);
end;
function TLookupStringList.Find(const S: string; out Index: Integer): Boolean;
begin
Index := IndexOf(S);
Result := Index <> -1;
end;
function TLookupStringList.IndexOf(const S: string): Integer;
begin
if FMap.Contains(S) then
Result := inherited IndexOf(S)
else
Result := -1
end;
end.