| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677 | { Author: Mattias Gaertner  2017  [email protected]  Abstract:    Low level file path handling.}unit Pas2jsFileUtils;{$mode objfpc}{$H+}{$i pas2js_defines.inc}interfaceuses  {$IFDEF Unix}  BaseUnix,  {$ENDIF}  SysUtils, Classes;function FilenameIsAbsolute(const aFilename: string):boolean;function FilenameIsWinAbsolute(const aFilename: string):boolean;function FilenameIsUnixAbsolute(const aFilename: string):boolean;function FileIsInPath(const Filename, Path: string): boolean;function ChompPathDelim(const Path: string): string;function ExpandFileNameUTF8(const FileName: string; {const} BaseDir: string = ''): string;function ExpandDirectory(const aDirectory: string): string;function TryCreateRelativePath(const Filename, BaseDirectory: String;  UsePointDirectory: boolean; out RelPath: String): Boolean;function ResolveDots(const AFilename: string): string;procedure ForcePathDelims(Var FileName: string);function GetForcedPathDelims(Const FileName: string): String;function ExtractFilenameOnly(const aFilename: string): string;function GetCurrentDirUTF8: String;function CompareFilenames(const File1, File2: string): integer;function GetPhysicalFilename(const Filename: string;        ExceptionOnError: boolean): string;function ResolveSymLinks(const Filename: string;                 {%H-}ExceptionOnError: boolean): string; // if a link is broken returns ''procedure FindMatchingFiles(Mask: string; MaxCount: integer; Files: TStrings);// find files, matching * and ?function GetEnvironmentVariableCountUTF8: Integer;function GetEnvironmentStringUTF8(Index: Integer): string;function GetEnvironmentVariableUTF8(const EnvVar: string): String;function GetNextDelimitedItem(const List: string; Delimiter: char;                              var Position: integer): string;type TChangeStamp = SizeInt;const InvalidChangeStamp = low(TChangeStamp);procedure IncreaseChangeStamp(var Stamp: TChangeStamp);const  UTF8BOM = #$EF#$BB#$BF;  EncodingUTF8 = 'UTF-8';  EncodingSystem = 'System';function NormalizeEncoding(const Encoding: string): string;function IsNonUTF8System: boolean;// true if system encoding is not UTF-8function UTF8CharacterStrictLength(P: PChar): integer;function GetDefaultTextEncoding: string;function GetConsoleTextEncoding: string;{$IFDEF Windows}// AConsole - If false, it is the general system encoding,//            if true, it is the console encodingfunction GetWindowsEncoding(AConsole: Boolean = False): string;{$ENDIF}{$IF defined(Unix) and not defined(Darwin)}function GetUnixEncoding: string;{$ENDIF}function IsASCII(const s: string): boolean; inline;function UTF8ToUTF16(const s: string): UnicodeString;function UTF16ToUTF8(const s: UnicodeString): string;function UTF8ToSystemCP(const s: string): string;function SystemCPToUTF8(const s: string): string;function ConsoleToUTF8(const s: string): string;// converts UTF8 string to console encoding (used by Write, WriteLn)function UTF8ToConsole(const s: string): string;implementation{$IFDEF Windows}uses Windows;{$ENDIF}var  EncodingValid: boolean = false;  DefaultTextEncoding: string = EncodingSystem;  {$IFDEF Unix}  {$IFNDEF Darwin}  Lang: string = '';  {$ENDIF}  {$ENDIF}  NonUTF8System: boolean = false;function FilenameIsWinAbsolute(const aFilename: string): boolean;begin  Result:=((length(aFilename)>=3) and           (aFilename[1] in ['A'..'Z','a'..'z']) and (aFilename[2]=':')  and (aFilename[3]in AllowDirectorySeparators))      or ((length(aFilename)>=2) and (aFilename[1] in AllowDirectorySeparators) and (aFilename[2] in AllowDirectorySeparators));end;function FilenameIsUnixAbsolute(const aFilename: string): boolean;begin  Result:=(aFilename<>'') and (aFilename[1]='/');end;function FileIsInPath(const Filename, Path: string): boolean;var  ExpFile: String;  ExpPath: String;  l: integer;begin  if Path='' then begin    Result:=false;    exit;  end;  ExpFile:=Filename;  ExpPath:=IncludeTrailingPathDelimiter(Path);  l:=length(ExpPath);  Result:=(l>0) and (length(ExpFile)>l) and (ExpFile[l]=PathDelim)          and (AnsiCompareFileName(ExpPath,LeftStr(ExpFile,l))=0);end;function ChompPathDelim(const Path: string): string;var  Len, MinLen: Integer;begin  Result:=Path;  if Path = '' then    exit;  Len:=length(Result);  if (Result[1] in AllowDirectorySeparators) then begin    MinLen := 1;    {$IFDEF HasUNCPaths}    if (Len >= 2) and (Result[2] in AllowDirectorySeparators) then      MinLen := 2; // keep UNC '\\', chomp 'a\' to 'a'    {$ENDIF}  end  else begin    MinLen := 0;    {$IFdef MSWindows}    if (Len >= 3) and (Result[1] in ['a'..'z', 'A'..'Z'])  and       (Result[2] = ':') and (Result[3] in AllowDirectorySeparators)    then      MinLen := 3;    {$ENDIF}  end;  while (Len > MinLen) and (Result[Len] in AllowDirectorySeparators) do dec(Len);  if Len<length(Result) then    SetLength(Result,Len);end;function ExpandDirectory(const aDirectory: string): string;begin  Result:=aDirectory;  if Result='' then exit;  Result:=ExpandFileNameUTF8(Result);  if Result='' then exit;  Result:=IncludeTrailingPathDelimiter(Result);end;function TryCreateRelativePath(const Filename, BaseDirectory: String;  UsePointDirectory: boolean; out RelPath: String): Boolean;{  Returns True if it is possible to create a relative path from Source to Dest  Function must be thread safe, so no expanding of filenames is done, since this  is not threadsafe (at least on Windows platform)  - Dest and Source must either be both absolute filenames, or relative  - Dest and Source cannot contain '..' since no expanding is done by design  - Dest and Source must be on same drive or UNC path (Windows)  - if both Dest and Source are relative they must at least share their base directory  - Double PathDelims are ignored (unless they are part of the UNC convention)  - if UsePointDirectory is True and Result is True then if RelPath is Empty string, RelPath becomes '.'  - if AlwaysRequireSharedBaseFolder is False then Absolute filenames need not share a basefolder  - if the function succeeds RelPath contains the relative path from Source to Dest,    no PathDelimiter is appended to the end of RelPath  Examples:  - Filename = /foo/bar BaseDirectory = /foo Result = True RelPath = bar  - Filename = /foo///bar BaseDirectory = /foo// Result = True RelPath = bar  - Filename = /foo BaseDirectory = /foo/bar Result = True RelPath = ../  - Filename = /foo/bar BaseDirectory = /bar Result = False (no shared base directory)  - Filename = foo/bar BaseDirectory = foo/foo Result = True RelPath = ../bar  - Filename = foo/bar BaseDirectory = bar/foo Result = False (no shared base directory)  - Filename = /foo BaseDirectory = bar Result = False (mixed absolute and relative)}  function IsNameChar(c: char): boolean; inline;  begin    Result:=(c<>#0) and not (c in AllowDirectorySeparators);  end;var  UpDirCount: Integer;  ResultPos: Integer;  i: Integer;  FileNameRestLen, SharedDirs: Integer;  FileP, BaseP, FileEndP, BaseEndP: PChar;begin  Result:=false;  RelPath:=Filename;  if (BaseDirectory='') or (Filename='') then exit;  // check for different windows file drives  if (CompareText(ExtractFileDrive(Filename),                     ExtractFileDrive(BaseDirectory))<>0)  then    exit;  FileP:=PChar(Filename);  BaseP:=PChar(BaseDirectory);  //writeln('TryCreateRelativePath START File="',FileP,'" Base="',BaseP,'"');  // skip matching directories  SharedDirs:=0;  if FileP^ in AllowDirectorySeparators then begin    if not (BaseP^ in AllowDirectorySeparators) then exit;    repeat      while FileP^ in AllowDirectorySeparators do inc(FileP);      while BaseP^ in AllowDirectorySeparators do inc(BaseP);      if (FileP^=#0) or (BaseP^=#0) then break;      //writeln('TryCreateRelativePath check match .. File="',FileP,'" Base="',BaseP,'"');      FileEndP:=FileP;      BaseEndP:=BaseP;      while IsNameChar(FileEndP^) do inc(FileEndP);      while IsNameChar(BaseEndP^) do inc(BaseEndP);      if CompareFilenames(copy(Filename,FileP-PChar(Filename)+1,FileEndP-FileP),        copy(BaseDirectory,BaseP-PChar(BaseDirectory)+1,BaseEndP-BaseP))<>0      then        break;      FileP:=FileEndP;      BaseP:=BaseEndP;      inc(SharedDirs);    until false;  end else if (BaseP^ in AllowDirectorySeparators) then    exit;  //writeln('TryCreateRelativePath skipped matches File="',FileP,'" Base="',BaseP,'"');  if SharedDirs=0 then exit;  // calculate needed '../'  UpDirCount:=0;  BaseEndP:=BaseP;  while IsNameChar(BaseEndP^) do begin    inc(UpDirCount);    while IsNameChar(BaseEndP^) do inc(BaseEndP);    while BaseEndP^ in AllowDirectorySeparators do inc(BaseEndP);  end;  //writeln('TryCreateRelativePath UpDirCount=',UpDirCount,' File="',FileP,'" Base="',BaseP,'"');  // create relative filename  if (FileP^=#0) and (UpDirCount=0) then begin    // Filename is the BaseDirectory    if UsePointDirectory then      RelPath:='.'    else      RelPath:='';    exit(true);  end;  FileNameRestLen:=length(Filename)-(FileP-PChar(Filename));  SetLength(RelPath,3*UpDirCount+FileNameRestLen);  ResultPos:=1;  for i:=1 to UpDirCount do begin    RelPath[ResultPos]:='.';    RelPath[ResultPos+1]:='.';    RelPath[ResultPos+2]:=PathDelim;    inc(ResultPos,3);  end;  if FileNameRestLen>0 then    Move(FileP^,RelPath[ResultPos],FileNameRestLen);  Result:=true;end;function ResolveDots(const AFilename: string): string;//trim double path delims and expand special dirs like .. and .//on Windows change also '/' to '\' except for filenames starting with '\\?\'var SrcPos, DestPos, l, DirStart: integer;  c: char;  MacroPos: LongInt;begin  Result:=AFilename;  {$ifdef windows}  //Special case: everything is literal after this, even dots (this does not apply to '//?/')  if (Pos('\\?\', AFilename) = 1) then Exit;  {$endif}  l:=length(AFilename);  SrcPos:=1;  DestPos:=1;  // trim double path delimiters and special dirs . and ..  while (SrcPos<=l) do begin    c:=AFilename[SrcPos];    {$ifdef windows}    //change / to \. The WinApi accepts both, but it leads to strange effects in other places    if (c in AllowDirectorySeparators) then c := PathDelim;    {$endif}    // check for double path delims    if (c=PathDelim) then begin      inc(SrcPos);      {$IFDEF Windows}      if (DestPos>2)      {$ELSE}      if (DestPos>1)      {$ENDIF}      and (Result[DestPos-1]=PathDelim) then begin        // skip second PathDelim        continue;      end;      Result[DestPos]:=c;      inc(DestPos);      continue;    end;    // check for special dirs . and ..    if (c='.') then begin      if (SrcPos<l) then begin        if (AFilename[SrcPos+1]=PathDelim)        and ((DestPos=1) or (AFilename[SrcPos-1]=PathDelim)) then begin          // special dir ./ or */./          // -> skip          inc(SrcPos,2);          continue;        end else if (AFilename[SrcPos+1]='.')        and (SrcPos+1=l) or (AFilename[SrcPos+2]=PathDelim) then        begin          // special dir ..          //  1. ..      -> copy          //  2. /..     -> skip .., keep /          //  3. C:..    -> copy          //  4. C:\..   -> skip .., keep C:\          //  5. \\..    -> skip .., keep \\          //  6. ../..   -> copy because if the first '..' was not resolved, the next can't neither          //  7. dir/..  -> trim dir and ..          //  8. dir$macro/..  -> copy          if DestPos=1 then begin            //  1. .. or ../  -> copy          end else if (DestPos=2) and (Result[1]=PathDelim) then begin            //  2. /..     -> skip .., keep /            inc(SrcPos,2);            continue;          {$IFDEF Windows}          end else if (DestPos=3) and (Result[2]=':')          and (Result[1] in ['a'..'z','A'..'Z']) then begin            //  3. C:..    -> copy          end else if (DestPos=4) and (Result[2]=':') and (Result[3]=PathDelim)          and (Result[1] in ['a'..'z','A'..'Z']) then begin            //  4. C:\..   -> skip .., keep C:\            inc(SrcPos,2);            continue;          end else if (DestPos=3) and (Result[1]=PathDelim)          and (Result[2]=PathDelim) then begin            //  5. \\..    -> skip .., keep \\            inc(SrcPos,2);            continue;          {$ENDIF}          end else if (DestPos>1) and (Result[DestPos-1]=PathDelim) then begin            // */.            if (DestPos>3)            and (Result[DestPos-2]='.') and (Result[DestPos-3]='.')            and ((DestPos=4) or (Result[DestPos-4]=PathDelim)) then begin              //  6. ../..   -> copy because if the first '..' was not resolved, the next can't neither            end else begin              //  7. xxxdir/..  -> trim dir and skip ..              DirStart:=DestPos-2;              while (DirStart>1) and (Result[DirStart-1]<>PathDelim) do                dec(DirStart);              MacroPos:=DirStart;              while MacroPos<DestPos do begin                if (Result[MacroPos]='$')                and (Result[MacroPos+1] in ['(','a'..'z','A'..'Z']) then begin                  // 8. directory contains a macro -> keep                  break;                end;                inc(MacroPos);              end;              if MacroPos=DestPos then begin                // previous directory does not contain a macro -> remove dir/..                DestPos:=DirStart;                inc(SrcPos,2);                //writeln('ResolveDots ',DestPos,' SrcPos=',SrcPos,' File="',AFilename,'" Result="',copy(Result,1,DestPos-1),'"');                if SrcPos>l then begin                  // '..' at end of filename                  if (DestPos>1) and (Result[DestPos-1]<>PathDelim) then begin                    // foo/dir/.. -> foo                    dec(DestPos);                  end else if (DestPos=1) then begin                    // foo/.. -> .                    Result[1]:='.';                    DestPos:=2;                  end;                end else if DestPos=1 then begin                  // e.g. 'foo/../'                  while (SrcPos<=l) and (AFilename[SrcPos] in AllowDirectorySeparators) do                    inc(SrcPos);                end;                continue;              end;            end;          end;        end;      end else begin        // special dir . at end of filename        if DestPos=1 then begin          Result:='.';          exit;        end else begin          // skip          break;        end;      end;    end;    // copy directory    repeat      Result[DestPos]:=c;      inc(DestPos);      inc(SrcPos);      if (SrcPos>l) then break;      c:=AFilename[SrcPos];      {$ifdef windows}      //change / to \. The WinApi accepts both, but it leads to strange effects in other places      if (c in AllowDirectorySeparators) then c := PathDelim;      {$endif}      if c=PathDelim then break;    until false;  end;  // trim result  if DestPos<=length(AFilename) then    SetLength(Result,DestPos-1);end;procedure ForcePathDelims(Var FileName: string);var  i: Integer;begin  for i:=1 to length(FileName) do    {$IFDEF Windows}    if Filename[i]='/' then      Filename[i]:='\';    {$ELSE}    if Filename[i]='\' then      Filename[i]:='/';    {$ENDIF}end;function GetForcedPathDelims(const FileName: string): String;begin  Result:=FileName;  ForcePathDelims(Result);end;function ExtractFilenameOnly(const aFilename: string): string;var  StartPos: Integer;  ExtPos: Integer;begin  StartPos:=length(AFilename)+1;  while (StartPos>1)  and not (AFilename[StartPos-1] in AllowDirectorySeparators)  {$IFDEF Windows}and (AFilename[StartPos-1]<>':'){$ENDIF}  do    dec(StartPos);  ExtPos:=length(AFilename);  while (ExtPos>=StartPos) and (AFilename[ExtPos]<>'.') do    dec(ExtPos);  if (ExtPos<StartPos) then ExtPos:=length(AFilename)+1;  Result:=copy(AFilename,StartPos,ExtPos-StartPos);end;function CompareFilenames(const File1, File2: string): integer;begin  Result:=AnsiCompareFileName(File1,File2);end;procedure FindMatchingFiles(Mask: string; MaxCount: integer; Files: TStrings);var  p: Integer;  Path, Filename: String;  Info: TRawByteSearchRec;begin  Mask:=ResolveDots(Mask);  p:=1;  while p<=length(Mask) do begin    if Mask[p] in ['*','?'] then begin      while (p<=length(Mask)) and not (Mask[p] in AllowDirectorySeparators) do inc(p);      Path:=LeftStr(Mask,p-1);      if FindFirst(Path,faAnyFile,Info)=0 then begin        repeat          if (Info.Name='') or (Info.Name='.') or (Info.Name='..') then continue;          Filename:=ExtractFilePath(Path)+Info.Name;          if p>length(Mask) then begin            // e.g. /path/unit*.pas            if Files.Count>=MaxCount then              raise EListError.Create('found too many files "'+Path+'"');            Files.Add(Filename);          end else begin            // e.g. /path/sub*path/...            FindMatchingFiles(Filename+copy(Mask,p,length(Mask)),MaxCount,Files);          end;        until FindNext(Info)<>0;      end;      exit;    end;    inc(p);  end;  if FileExists(Mask) then begin    if Files.Count>=MaxCount then      raise EListError.Create('found too many files "'+Mask+'"');    Files.Add(Mask);  end;end;function GetNextDelimitedItem(const List: string; Delimiter: char;  var Position: integer): string;var  StartPos: Integer;begin  StartPos:=Position;  while (Position<=length(List)) and (List[Position]<>Delimiter) do    inc(Position);  Result:=copy(List,StartPos,Position-StartPos);  if Position<=length(List) then inc(Position); // skip Delimiterend;procedure IncreaseChangeStamp(var Stamp: TChangeStamp);begin  if Stamp<High(TChangeStamp) then    inc(Stamp)  else    Stamp:=InvalidChangeStamp+1;end;function IsNonUTF8System: boolean;begin  Result:=NonUTF8System;end;function UTF8CharacterStrictLength(P: PChar): integer;begin  if p=nil then exit(0);  if ord(p^)<%10000000 then begin    // regular single byte character    exit(1);  end  else if ord(p^)<%11000000 then begin    // invalid single byte character    exit(0);  end  else if ((ord(p^) and %11100000) = %11000000) then begin    // should be 2 byte character    if (ord(p[1]) and %11000000) = %10000000 then      exit(2)    else      exit(0);  end  else if ((ord(p^) and %11110000) = %11100000) then begin    // should be 3 byte character    if ((ord(p[1]) and %11000000) = %10000000)    and ((ord(p[2]) and %11000000) = %10000000) then      exit(3)    else      exit(0);  end  else if ((ord(p^) and %11111000) = %11110000) then begin    // should be 4 byte character    if ((ord(p[1]) and %11000000) = %10000000)    and ((ord(p[2]) and %11000000) = %10000000)    and ((ord(p[3]) and %11000000) = %10000000) then      exit(4)    else      exit(0);  end else    exit(0);end;function GetDefaultTextEncoding: string;begin  if EncodingValid then begin    Result:=DefaultTextEncoding;    exit;  end;  {$IFDEF Windows}  Result:=GetWindowsEncoding;  {$ELSE}  {$IFDEF Darwin}  Result:=EncodingUTF8;  {$ELSE}  Lang := GetEnvironmentVariable('LC_ALL');  if Lang='' then begin    Lang := GetEnvironmentVariable('LC_MESSAGES');    if Lang='' then      Lang := GetEnvironmentVariable('LANG');  end;  Result:=GetUnixEncoding;  {$ENDIF}  {$ENDIF}  Result:=NormalizeEncoding(Result);  DefaultTextEncoding:=Result;  EncodingValid:=true;end;function NormalizeEncoding(const Encoding: string): string;var  i: Integer;begin  Result:=LowerCase(Encoding);  for i:=length(Result) downto 1 do    if Result[i]='-' then Delete(Result,i,1);end;function IsASCII(const s: string): boolean; inline;var  p: PChar;begin  if s='' then exit(true);  p:=PChar(s);  repeat    case p^ of    #0: if p-PChar(s)=length(s) then exit(true);    #128..#255: exit(false);    end;    inc(p);  until false;end;function UTF8ToUTF16(const s: string): UnicodeString;begin  Result:=UTF8Decode(s);end;function UTF16ToUTF8(const s: UnicodeString): string;begin  if s='' then exit('');  Result:=UTF8Encode(s);  // prevent UTF8 codepage appear in the strings - we don't need codepage  // conversion magic  SetCodePage(RawByteString(Result), CP_ACP, False);end;{$IFDEF Unix}  {$I pas2jsfileutilsunix.inc}{$ENDIF}{$IFDEF Windows}  {$I pas2jsfileutilswin.inc}{$ENDIF}procedure InternalInit;begin  SetMultiByteConversionCodePage(CP_UTF8);  // SetMultiByteFileSystemCodePage(CP_UTF8); not needed, this is the default under Windows  SetMultiByteRTLFileSystemCodePage(CP_UTF8);  GetDefaultTextEncoding;  {$IFDEF Windows}  NonUTF8System:=true;  {$ELSE}  NonUTF8System:=SysUtils.CompareText(DefaultTextEncoding,'UTF8')<>0;  {$ENDIF}  InitPlatform;end;initialization  InternalInit;finalization  FinalizePlatform;end.
 |