{ ***************************************************************************** This file is part of LazUtils. See the file COPYING.modifiedLGPL.txt, included in this distribution, for details about the license. ***************************************************************************** Author: Juha Manninen / Antônio Galvão Abstract: This is an unsorted StringList with a fast lookup feature. Internally it uses a map container to store the strings again which is then used for Contains, IndexOf and Find methods. The extra container does not reserve too much memory because the strings are reference counted and not really copied. All Duplicates property values are fully supported, including dupIgnore and dupError, unlike in unsorted StringList. This class is useful only when you must preserve the order in list, but also need to do fast lookups to see if a string exists, or must prevent duplicates. } unit LookupStringList; {$mode objfpc}{$H+} interface uses Classes, SysUtils, AvgLvlTree; type { TLookupStringList } TLookupStringList = class(TStringList) private FMap: TStringMap; protected procedure InsertItem(Index: Integer; const S: string); override; public constructor Create(aCaseSensitive: Boolean); constructor Create; destructor Destroy; override; procedure Assign(Source: TPersistent); override; procedure Clear; override; procedure Delete(Index: Integer); override; function Add(const S: string): Integer; override; function AddObject(const S: string; AObject: TObject): Integer; override; function Contains(const S: string): Boolean; // A new function function Find(const S: string; out Index: Integer): Boolean; override; function IndexOf(const S: string): Integer; override; end; function Deduplicate(AStrings: TStrings): Integer; implementation function Deduplicate(AStrings: TStrings): Integer; // Removes duplicate strings (case sensitive) from AStrings. // Returns the number of duplicates removed. var DSL: TLookupStringList; InCnt: Integer; begin InCnt := AStrings.Count; DSL := TLookupStringList.Create(True); try DSL.Assign(AStrings); AStrings.Assign(DSL); Result := InCnt - AStrings.Count; finally DSL.Free; end; end; { TLookupStringList } constructor TLookupStringList.Create(aCaseSensitive: Boolean); begin inherited Create; CaseSensitive := aCaseSensitive; FMap := TStringMap.Create(aCaseSensitive); end; constructor TLookupStringList.Create; begin Create(False); // Case-insensitive by default end; destructor TLookupStringList.Destroy; begin FMap.Free; inherited Destroy; end; procedure TLookupStringList.Assign(Source: TPersistent); begin inherited Assign(Source); if Source is TLookupStringList then FMap.Assign(TLookupStringList(Source).FMap); end; procedure TLookupStringList.Clear; begin inherited Clear; FMap.Clear; end; procedure TLookupStringList.Delete(Index: Integer); var s: String; begin s := Strings[Index]; inherited Delete(Index); // The string must not be deleted from map if there are duplicates. // Calling IndexOf is slow but it is needed. if (Duplicates <> dupAccept) or (inherited IndexOf(s) = -1) then FMap.Remove(s); end; function TLookupStringList.Add(const S: string): Integer; begin if not Sorted and (Duplicates = dupIgnore) and FMap.Contains(S) then Result := -1 else Result := inherited Add(S); end; function TLookupStringList.AddObject(const S: string; AObject: TObject): Integer; begin Result := Add(S); if Result > -1 then Objects[Result] := AObject; end; procedure TLookupStringList.InsertItem(Index: Integer; const S: string); begin if not Sorted and (Duplicates <> dupAccept) then if FMap.Contains(S) then case Duplicates of DupIgnore : Exit; DupError : raise Exception.Create('TLookupStringList.InsertItem:' +' Duplicates are not allowed.'); end; inherited InsertItem(Index, S); FMap.Add(S); // Insert string to map, too. end; function TLookupStringList.Contains(const S: string): Boolean; begin Result := FMap.Contains(S); end; function TLookupStringList.Find(const S: string; out Index: Integer): Boolean; begin Index := IndexOf(S); Result := Index <> -1; end; function TLookupStringList.IndexOf(const S: string): Integer; begin if FMap.Contains(S) then Result := inherited IndexOf(S) else Result := -1 end; end.