ソースを参照

rtl: add basic implementation of TEncoding class

git-svn-id: trunk@19355 -
paul 14 年 前
コミット
abf9816a09

+ 2 - 0
.gitattributes

@@ -7804,6 +7804,8 @@ rtl/objpas/sysutils/stre.inc svneol=native#text/plain
 rtl/objpas/sysutils/strg.inc svneol=native#text/plain
 rtl/objpas/sysutils/sysansi.inc svneol=native#text/plain
 rtl/objpas/sysutils/sysansih.inc svneol=native#text/plain
+rtl/objpas/sysutils/sysencoding.inc svneol=native#text/pascal
+rtl/objpas/sysutils/sysencodingh.inc svneol=native#text/pascal
 rtl/objpas/sysutils/sysformt.inc svneol=native#text/plain
 rtl/objpas/sysutils/sysint.inc svneol=native#text/plain
 rtl/objpas/sysutils/sysinth.inc svneol=native#text/plain

+ 2 - 0
rtl/objpas/sysconst.pp

@@ -121,6 +121,8 @@ resourcestring
 
   SNoToolserver                 = 'Toolserver is not installed, cannot execute Tool';
 
+  SNotValidCodePageName         = '%s is not a valid code page name';
+
   SNoArrayMatch                 = 'Can''t match any allowed value at pattern position %d, string position %d.';
   SNoCharMatch                  = 'Mismatch char "%s" <> "%s" at pattern position %d, string position %d.';
   SHHMMError                    = 'mm in a sequence hh:mm is interpreted as minutes. No longer versions allowed! (Position : %d).' ;

+ 536 - 0
rtl/objpas/sysutils/sysencoding.inc

@@ -0,0 +1,536 @@
+{$ifndef VER2_4}
+{ TEncoding }
+
+class function TEncoding.GetANSI: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seAnsi]) then
+    FStandardEncodings[seAnsi] := TMBCSEncoding.Create(DefaultSystemCodePage);
+  Result := FStandardEncodings[seAnsi];
+end;
+
+class function TEncoding.GetASCII: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seAscii]) then
+    FStandardEncodings[seAscii] := TMBCSEncoding.Create(CP_ASCII);
+  Result := FStandardEncodings[seAscii];
+end;
+
+class function TEncoding.GetBigEndianUnicode: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seBigEndianUnicode]) then
+    FStandardEncodings[seBigEndianUnicode] := TBigEndianUnicodeEncoding.Create;
+  Result := FStandardEncodings[seBigEndianUnicode];
+end;
+
+class function TEncoding.GetDefault: TEncoding;
+begin
+  Result := GetANSI;
+end;
+
+class function TEncoding.GetUnicode: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seUnicode]) then
+    FStandardEncodings[seUnicode] := TUnicodeEncoding.Create;
+  Result := FStandardEncodings[seUnicode];
+end;
+
+class function TEncoding.GetUTF7: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seUTF7]) then
+    FStandardEncodings[seUTF7] := TUTF7Encoding.Create;
+  Result := FStandardEncodings[seUTF7];
+end;
+
+class function TEncoding.GetUTF8: TEncoding;
+begin
+  if not Assigned(FStandardEncodings[seUTF8]) then
+    FStandardEncodings[seUTF8] := TUTF8Encoding.Create;
+  Result := FStandardEncodings[seUTF8];
+end;
+
+class procedure TEncoding.FreeEncodings;
+var
+  E: TStandardEncoding;
+begin
+  for E := Low(FStandardEncodings) to High(FStandardEncodings) do
+    FStandardEncodings[E].Free;
+end;
+
+class constructor TEncoding.Create;
+var
+  E: TStandardEncoding;
+begin
+  for E := Low(FStandardEncodings) to High(FStandardEncodings) do
+    FStandardEncodings[E] := nil;
+end;
+
+class destructor TEncoding.Destroy;
+begin
+  FreeEncodings;
+end;
+
+function TEncoding.Clone: TEncoding;
+begin
+  Result := nil;
+end;
+
+class function TEncoding.Convert(Source, Destination: TEncoding;
+  const Bytes: TBytes): TBytes;
+begin
+  Result := Destination.GetBytes(Source.GetChars(Bytes));
+end;
+
+class function TEncoding.Convert(Source, Destination: TEncoding;
+  const Bytes: TBytes; StartIndex, Count: Integer): TBytes;
+begin
+  Result := Destination.GetBytes(Source.GetChars(Bytes, StartIndex, Count));
+end;
+
+class function TEncoding.IsStandardEncoding(AEncoding: TEncoding): Boolean;
+var
+  Encoding: TEncoding;
+begin
+  if Assigned(AEncoding) then
+    for Encoding in FStandardEncodings do
+      if Encoding = AEncoding then
+        Exit(True);
+  Result := False;
+end;
+
+class function TEncoding.GetBufferEncoding(const Buffer: TBytes; var AEncoding: TEncoding): Integer;
+begin
+  Result := GetBufferEncoding(Buffer, AEncoding, Default);
+end;
+
+class function TEncoding.GetBufferEncoding(const Buffer: TBytes;
+  var AEncoding: TEncoding; ADefaultEncoding: TEncoding): Integer;
+
+  function CheckEncoding(AEncoding: TEncoding; out ByteCount: Integer): Boolean;
+  var
+    Preamble: TBytes;
+  begin
+    Preamble := AEncoding.GetPreamble;
+    ByteCount := Length(Preamble);
+    Result := (Length(Buffer) >= ByteCount) and (ByteCount > 0);
+    if Result then
+      Result := CompareMem(@Preamble[0], @Buffer[0], ByteCount);
+  end;
+
+begin
+  if Assigned(AEncoding) then
+  begin
+    if not CheckEncoding(AEncoding, Result) then
+      Result := 0;
+  end
+  else
+  if CheckEncoding(Unicode, Result) then
+    AEncoding := Unicode
+  else
+  if CheckEncoding(BigEndianUnicode, Result) then
+    AEncoding := BigEndianUnicode
+  else
+  if CheckEncoding(UTF8, Result) then
+    AEncoding := UTF8
+  else
+  begin
+    AEncoding := ADefaultEncoding;
+    Result := 0;
+  end;
+end;
+
+function TEncoding.GetByteCount(const Chars: TUnicodeCharArray): Integer;
+begin
+  Result := GetByteCount(Chars, 0, Length(Chars));
+end;
+
+function TEncoding.GetByteCount(const Chars: TUnicodeCharArray; CharIndex,
+  CharCount: Integer): Integer;
+begin
+  Result := GetByteCount(@Chars[CharIndex], CharCount);
+end;
+
+function TEncoding.GetByteCount(const S: UnicodeString): Integer;
+begin
+  Result := GetByteCount(PUnicodeChar(S), Length(S));
+end;
+
+function TEncoding.GetByteCount(const S: UnicodeString; CharIndex, CharCount: Integer): Integer;
+begin
+  Result := GetByteCount(@S[CharIndex], CharCount);
+end;
+
+function TEncoding.GetBytes(const Chars: TUnicodeCharArray): TBytes;
+begin
+  SetLength(Result, GetByteCount(Chars));
+  GetBytes(@Chars[0], Length(Chars), @Result[0], Length(Result));
+end;
+
+function TEncoding.GetBytes(const Chars: TUnicodeCharArray; CharIndex,
+  CharCount: Integer): TBytes;
+begin
+  SetLength(Result, GetByteCount(Chars, CharIndex, CharCount));
+  GetBytes(@Chars[CharIndex], CharCount, @Result[0], Length(Result));
+end;
+
+function TEncoding.GetBytes(const Chars: TUnicodeCharArray; CharIndex,
+  CharCount: Integer; const Bytes: TBytes; ByteIndex: Integer): Integer;
+begin
+  Result := GetBytes(@Chars[CharIndex], CharCount, @Bytes[ByteIndex], Length(Bytes) - ByteIndex);
+end;
+
+function TEncoding.GetBytes(const S: UnicodeString): TBytes;
+begin
+  SetLength(Result, GetByteCount(S));
+  GetBytes(@S[1], Length(S), @Result[0], Length(Result));
+end;
+
+function TEncoding.GetBytes(const S: UnicodeString; CharIndex, CharCount: Integer;
+  const Bytes: TBytes; ByteIndex: Integer): Integer;
+begin
+  Result := GetBytes(@S[CharIndex], CharCount, @Bytes[ByteIndex], Length(Bytes) - ByteIndex);
+end;
+
+function TEncoding.GetCharCount(const Bytes: TBytes): Integer;
+begin
+  Result := GetCharCount(@Bytes[0], Length(Bytes));
+end;
+
+function TEncoding.GetCharCount(const Bytes: TBytes; ByteIndex,
+  ByteCount: Integer): Integer;
+begin
+  Result := GetCharCount(@Bytes[ByteIndex], ByteCount);
+end;
+
+function TEncoding.GetChars(const Bytes: TBytes): TUnicodeCharArray;
+begin
+  SetLength(Result, GetCharCount(Bytes));
+  GetChars(@Bytes[0], Length(Bytes), @Result[0], Length(Result));
+end;
+
+function TEncoding.GetChars(const Bytes: TBytes; ByteIndex, ByteCount: Integer): TUnicodeCharArray;
+begin
+  SetLength(Result, GetCharCount(Bytes, ByteIndex, ByteCount));
+  GetChars(@Bytes[ByteIndex], ByteCount, @Result[0], Length(Result));
+end;
+
+function TEncoding.GetChars(const Bytes: TBytes; ByteIndex, ByteCount: Integer;
+  const Chars: TUnicodeCharArray; CharIndex: Integer): Integer;
+begin
+  Result := GetChars(@Bytes[ByteIndex], ByteCount, @Chars[CharIndex], Length(Chars) - CharIndex);
+end;
+
+class function TEncoding.GetEncoding(CodePage: Integer): TEncoding;
+begin
+  case CodePage of
+    CP_UTF16: Result := TUnicodeEncoding.Create;
+    CP_UTF16BE: Result := TBigEndianUnicodeEncoding.Create;
+    CP_UTF7: Result := TUTF7Encoding.Create;
+    CP_UTF8: Result := TUTF8Encoding.Create;
+  else
+    Result := TMBCSEncoding.Create(CodePage);
+  end;
+end;
+
+class function TEncoding.GetEncoding(const EncodingName: UnicodeString): TEncoding;
+var
+  ACodePage: TSystemCodePage;
+begin
+  ACodePage := CodePageNameToCodePage(EncodingName);
+  if ACodePage = $FFFF then
+    raise EEncodingError.CreateFmt(SNotValidCodePageName, [EncodingName]);
+  Result := TMBCSEncoding.Create(ACodePage);
+end;
+
+function TEncoding.GetString(const Bytes: TBytes): UnicodeString;
+var
+  Chars: TUnicodeCharArray;
+begin
+  Chars := GetChars(Bytes);
+  SetString(Result, PUnicodeChar(Chars), Length(Chars));
+end;
+
+function TEncoding.GetString(const Bytes: TBytes; ByteIndex, ByteCount: Integer): UnicodeString;
+var
+  Chars: TUnicodeCharArray;
+begin
+  Chars := GetChars(Bytes, ByteIndex, ByteCount);
+  SetString(Result, PUnicodeChar(Chars), Length(Chars));
+end;
+
+{ TMBCSEncoding }
+
+function TMBCSEncoding.GetByteCount(Chars: PUnicodeChar; CharCount: Integer): Integer;
+var
+  S: RawByteString;
+begin
+  widestringmanager.Unicode2AnsiMoveProc(Chars, S, CodePage, CharCount);
+  Result := Length(S);
+end;
+
+function TMBCSEncoding.GetBytes(Chars: PUnicodeChar; CharCount: Integer; Bytes: PByte;
+  ByteCount: Integer): Integer;
+var
+  S: RawByteString;
+begin
+  widestringmanager.Unicode2AnsiMoveProc(Chars, S, CodePage, CharCount);
+  Result := Length(S);
+  if ByteCount < Result then
+    Result := ByteCount;
+  if Result > 0 then
+    Move(S[1], Bytes[0], Result);
+end;
+
+function TMBCSEncoding.GetCharCount(Bytes: PByte; ByteCount: Integer): Integer;
+var
+  U: UnicodeString;
+begin
+  widestringmanager.Ansi2UnicodeMoveProc(PChar(Bytes), CodePage, U, ByteCount);
+  Result := Length(U);
+end;
+
+function TMBCSEncoding.GetChars(Bytes: PByte; ByteCount: Integer; Chars: PUnicodeChar;
+  CharCount: Integer): Integer;
+var
+  U: UnicodeString;
+begin
+  widestringmanager.Ansi2UnicodeMoveProc(PChar(Bytes), CodePage, U, ByteCount);
+  Result := Length(U);
+  if CharCount < Result then
+    Result := CharCount;
+  if Result > 0 then
+    Move(U[1], Chars[0], Result * SizeOf(UnicodeChar));
+end;
+
+function TMBCSEncoding.GetCodePage: Cardinal;
+begin
+  Result := FCodePage;
+end;
+
+function TMBCSEncoding.GetEncodingName: UnicodeString;
+begin
+  Result := CodePageToCodePageName(CodePage);
+end;
+
+constructor TMBCSEncoding.Create;
+begin
+  Create(DefaultSystemCodePage, 0, 0);
+end;
+
+constructor TMBCSEncoding.Create(ACodePage: Integer);
+begin
+  Create(ACodePage, 0, 0);
+end;
+
+constructor TMBCSEncoding.Create(ACodePage, MBToWCharFlags,
+  WCharToMBFlags: Integer);
+begin
+  FCodePage := ACodePage;
+  FMBToWCharFlags := MBToWCharFlags;
+  FWCharToMBFlags := WCharToMBFlags;
+end;
+
+function TMBCSEncoding.Clone: TEncoding;
+begin
+  Result := TMBCSEncoding.Create(FCodePage, FMBToWCharFlags, FWCharToMBFlags);
+end;
+
+function TMBCSEncoding.GetMaxByteCount(CharCount: Integer): Integer;
+begin
+  Result := CharCount;
+end;
+
+function TMBCSEncoding.GetMaxCharCount(ByteCount: Integer): Integer;
+begin
+  Result := ByteCount;
+end;
+
+function TMBCSEncoding.GetPreamble: TBytes;
+begin
+  Result := nil;
+end;
+
+{ TUTF7Encoding }
+
+constructor TUTF7Encoding.Create;
+begin
+  inherited Create(CP_UTF7);
+  FIsSingleByte := False;
+end;
+
+function TUTF7Encoding.Clone: TEncoding;
+begin
+  Result := TUTF7Encoding.Create;
+end;
+
+function TUTF7Encoding.GetMaxByteCount(CharCount: Integer): Integer;
+begin
+  Result := CharCount * 3 + 2;
+end;
+
+function TUTF7Encoding.GetMaxCharCount(ByteCount: Integer): Integer;
+begin
+  Result := ByteCount;
+end;
+
+{ TUTF8Encoding }
+
+constructor TUTF8Encoding.Create;
+begin
+  inherited Create(CP_UTF8);
+  FIsSingleByte := False;
+end;
+
+function TUTF8Encoding.Clone: TEncoding;
+begin
+  Result := TUTF8Encoding.Create;
+end;
+
+function TUTF8Encoding.GetMaxByteCount(CharCount: Integer): Integer;
+begin
+  Result := CharCount * 3;
+end;
+
+function TUTF8Encoding.GetMaxCharCount(ByteCount: Integer): Integer;
+begin
+  Result := ByteCount;
+end;
+
+function TUTF8Encoding.GetPreamble: TBytes;
+begin
+  SetLength(Result, 3);
+  Result[0] := $EF;
+  Result[1] := $BB;
+  Result[2] := $BF;
+end;
+
+{ TUnicodeEncoding }
+
+function TUnicodeEncoding.GetByteCount(Chars: PUnicodeChar; CharCount: Integer): Integer;
+begin
+  Result := CharCount * SizeOf(UnicodeChar);
+end;
+
+function TUnicodeEncoding.GetBytes(Chars: PUnicodeChar; CharCount: Integer;
+  Bytes: PByte; ByteCount: Integer): Integer;
+begin
+  Result := CharCount * SizeOf(UnicodeChar);
+  if ByteCount < Result then
+    Result := ByteCount;
+  if Result > 0 then
+    Move(Chars[0], Bytes[0], Result);
+end;
+
+function TUnicodeEncoding.GetCharCount(Bytes: PByte; ByteCount: Integer): Integer;
+begin
+  Result := ByteCount div SizeOf(UnicodeChar);
+end;
+
+function TUnicodeEncoding.GetChars(Bytes: PByte; ByteCount: Integer;
+  Chars: PUnicodeChar; CharCount: Integer): Integer;
+begin
+  Result := ByteCount div 2;
+  if CharCount < Result then
+    Result := CharCount;
+  Move(Bytes[0], Chars[0], Result * SizeOf(UnicodeChar));
+end;
+
+function TUnicodeEncoding.GetCodePage: Cardinal;
+begin
+  Result := CP_UTF16;
+end;
+
+function TUnicodeEncoding.GetEncodingName: UnicodeString;
+begin
+  Result := CodePageToCodePageName(CodePage);
+end;
+
+constructor TUnicodeEncoding.Create;
+begin
+  inherited Create;
+  FIsSingleByte := False;
+  FMaxCharSize := SizeOf(UnicodeChar);
+end;
+
+function TUnicodeEncoding.Clone: TEncoding;
+begin
+  Result := TUnicodeEncoding.Create;
+end;
+
+function TUnicodeEncoding.GetMaxByteCount(CharCount: Integer): Integer;
+begin
+  Result := CharCount * SizeOf(UnicodeChar);
+end;
+
+function TUnicodeEncoding.GetMaxCharCount(ByteCount: Integer): Integer;
+begin
+  Result := ByteCount div SizeOf(UnicodeChar);
+end;
+
+function TUnicodeEncoding.GetPreamble: TBytes;
+begin
+  SetLength(Result, 2);
+  Result[0] := $FF;
+  Result[1] := $FE;
+end;
+
+{ TBigEndianUnicodeEncoding }
+
+function TBigEndianUnicodeEncoding.GetBytes(Chars: PUnicodeChar; CharCount: Integer;
+  Bytes: PByte; ByteCount: Integer): Integer;
+var
+  LastByte: PByte;
+begin
+  Result := CharCount * SizeOf(UnicodeChar);
+  if ByteCount < Result then
+    Result := ByteCount;
+  LastByte := @Bytes[Result];
+  while Bytes < LastByte do
+  begin
+    Bytes^ := Hi(Word(Chars^));
+    inc(Bytes);
+    if Bytes < LastByte then
+      Bytes^ := Lo(Word(Chars^));
+    inc(Bytes);
+    inc(Chars);
+  end;
+end;
+
+function TBigEndianUnicodeEncoding.GetChars(Bytes: PByte; ByteCount: Integer;
+  Chars: PUnicodeChar; CharCount: Integer): Integer;
+var
+  LastChar: PUnicodeChar;
+begin
+  Result := ByteCount div SizeOf(UnicodeChar);
+  if CharCount < Result then
+    Result := CharCount;
+  LastChar := @Chars[Result];
+  while Chars <= LastChar do
+  begin
+    Chars^ := UnicodeChar(Bytes[1] + Bytes[0] shl 8);
+    inc(Bytes, SizeOf(UnicodeChar));
+    inc(Chars);
+  end;
+end;
+
+function TBigEndianUnicodeEncoding.GetCodePage: Cardinal;
+begin
+  Result := CP_UTF16BE;
+end;
+
+function TBigEndianUnicodeEncoding.GetEncodingName: UnicodeString;
+begin
+  Result := CodePageToCodePageName(CodePage);
+end;
+
+function TBigEndianUnicodeEncoding.Clone: TEncoding;
+begin
+  Result := TBigEndianUnicodeEncoding.Create;
+end;
+
+function TBigEndianUnicodeEncoding.GetPreamble: TBytes;
+begin
+  SetLength(Result, 2);
+  Result[0] := $FE;
+  Result[1] := $FF;
+end;
+{$endif VER2_4}

+ 161 - 0
rtl/objpas/sysutils/sysencodingh.inc

@@ -0,0 +1,161 @@
+{$ifndef VER2_4}
+type
+  EEncodingError = class(Exception);
+
+  { TEncoding }
+
+  TEncoding = class
+  strict private
+    type
+      TStandardEncoding = (
+        seAnsi,
+        seAscii,
+        seUnicode,
+        seBigEndianUnicode,
+        seUTF7,
+        seUTF8);
+    var
+      FStandardEncodings: array[TStandardEncoding] of TEncoding; static;
+
+    class function GetANSI: TEncoding; static;
+    class function GetASCII: TEncoding; static;
+    class function GetBigEndianUnicode: TEncoding; static;
+    class function GetDefault: TEncoding; static;
+    class function GetUnicode: TEncoding; static;
+    class function GetUTF7: TEncoding; static;
+    class function GetUTF8: TEncoding; static;
+
+    class constructor Create;
+    class destructor Destroy;
+  strict protected
+    FIsSingleByte: Boolean;
+    FMaxCharSize: Integer;
+    function GetByteCount(Chars: PUnicodeChar; CharCount: Integer): Integer; overload; virtual; abstract;
+    function GetBytes(Chars: PUnicodeChar; CharCount: Integer; Bytes: PByte; ByteCount: Integer): Integer; overload; virtual; abstract;
+    function GetCharCount(Bytes: PByte; ByteCount: Integer): Integer; overload; virtual; abstract;
+    function GetChars(Bytes: PByte; ByteCount: Integer; Chars: PUnicodeChar; CharCount: Integer): Integer; overload; virtual; abstract;
+    function GetCodePage: Cardinal; virtual; abstract;
+    function GetEncodingName: UnicodeString; virtual; abstract;
+  public
+    class procedure FreeEncodings;
+    function Clone: TEncoding; virtual;
+    class function Convert(Source, Destination: TEncoding; const Bytes: TBytes): TBytes; overload;
+    class function Convert(Source, Destination: TEncoding; const Bytes: TBytes; StartIndex, Count: Integer): TBytes; overload;
+    class function IsStandardEncoding(AEncoding: TEncoding): Boolean; static;
+    class function GetBufferEncoding(const Buffer: TBytes; var AEncoding: TEncoding): Integer; overload; static;
+    class function GetBufferEncoding(const Buffer: TBytes; var AEncoding: TEncoding;
+      ADefaultEncoding: TEncoding): Integer; overload; static;
+    function GetByteCount(const Chars: TUnicodeCharArray): Integer; overload;
+    function GetByteCount(const Chars: TUnicodeCharArray; CharIndex, CharCount: Integer): Integer; overload;
+    function GetByteCount(const S: UnicodeString): Integer; overload;
+    function GetByteCount(const S: UnicodeString; CharIndex, CharCount: Integer): Integer; overload;
+    function GetBytes(const Chars: TUnicodeCharArray): TBytes; overload;
+    function GetBytes(const Chars: TUnicodeCharArray; CharIndex, CharCount: Integer): TBytes; overload;
+    function GetBytes(const Chars: TUnicodeCharArray; CharIndex, CharCount: Integer;
+      const Bytes: TBytes; ByteIndex: Integer): Integer; overload;
+    function GetBytes(const S: UnicodeString): TBytes; overload;
+    function GetBytes(const S: UnicodeString; CharIndex, CharCount: Integer;
+      const Bytes: TBytes; ByteIndex: Integer): Integer; overload;
+    function GetCharCount(const Bytes: TBytes): Integer; overload;
+    function GetCharCount(const Bytes: TBytes; ByteIndex, ByteCount: Integer): Integer; overload;
+    function GetChars(const Bytes: TBytes): TUnicodeCharArray; overload;
+    function GetChars(const Bytes: TBytes; ByteIndex, ByteCount: Integer): TUnicodeCharArray; overload;
+    function GetChars(const Bytes: TBytes; ByteIndex, ByteCount: Integer;
+      const Chars: TUnicodeCharArray; CharIndex: Integer): Integer; overload;
+    class function GetEncoding(CodePage: Integer): TEncoding; overload; static;
+    class function GetEncoding(const EncodingName: UnicodeString): TEncoding; overload; static;
+    function GetMaxByteCount(CharCount: Integer): Integer; virtual; abstract;
+    function GetMaxCharCount(ByteCount: Integer): Integer; virtual; abstract;
+    function GetPreamble: TBytes; virtual; abstract;
+    function GetString(const Bytes: TBytes): UnicodeString; overload;
+    function GetString(const Bytes: TBytes; ByteIndex, ByteCount: Integer): UnicodeString; overload;
+
+    property CodePage: Cardinal read GetCodePage;
+    property EncodingName: UnicodeString read GetEncodingName;
+    property IsSingleByte: Boolean read FIsSingleByte;
+
+    class property ANSI: TEncoding read GetANSI;
+    class property ASCII: TEncoding read GetASCII;
+    class property BigEndianUnicode: TEncoding read GetBigEndianUnicode;
+    class property Default: TEncoding read GetDefault;
+    class property Unicode: TEncoding read GetUnicode;
+    class property UTF7: TEncoding read GetUTF7;
+    class property UTF8: TEncoding read GetUTF8;
+  end;
+
+  { TMBCSEncoding }
+
+  TMBCSEncoding = class(TEncoding)
+  strict private
+    FCodePage: Integer;
+    FMBToWCharFlags: Integer;
+    FWCharToMBFlags: Integer;
+  strict protected
+    function GetByteCount(Chars: PUnicodeChar; CharCount: Integer): Integer; overload; override;
+    function GetBytes(Chars: PUnicodeChar; CharCount: Integer; Bytes: PByte; ByteCount: Integer): Integer; overload; override;
+    function GetCharCount(Bytes: PByte; ByteCount: Integer): Integer; overload; override;
+    function GetChars(Bytes: PByte; ByteCount: Integer; Chars: PUnicodeChar; CharCount: Integer): Integer; overload; override;
+    function GetCodePage: Cardinal; override;
+    function GetEncodingName: UnicodeString; override;
+  public
+    constructor Create; overload; virtual;
+    constructor Create(ACodePage: Integer); overload; virtual;
+    constructor Create(ACodePage, MBToWCharFlags, WCharToMBFlags: Integer); overload; virtual;
+    function Clone: TEncoding; override;
+    function GetMaxByteCount(CharCount: Integer): Integer; override;
+    function GetMaxCharCount(ByteCount: Integer): Integer; override;
+    function GetPreamble: TBytes; override;
+  end;
+
+  { TUTF7Encoding }
+
+  TUTF7Encoding = class(TMBCSEncoding)
+  public
+    constructor Create; override;
+    function Clone: TEncoding; override;
+    function GetMaxByteCount(CharCount: Integer): Integer; override;
+    function GetMaxCharCount(ByteCount: Integer): Integer; override;
+  end;
+
+  { TUTF8Encoding }
+
+  TUTF8Encoding = class(TUTF7Encoding)
+  public
+    constructor Create; override;
+    function Clone: TEncoding; override;
+    function GetMaxByteCount(CharCount: Integer): Integer; override;
+    function GetMaxCharCount(ByteCount: Integer): Integer; override;
+    function GetPreamble: TBytes; override;
+  end;
+
+  { TUnicodeEncoding }
+
+  TUnicodeEncoding = class(TEncoding)
+  strict protected
+    function GetByteCount(Chars: PUnicodeChar; CharCount: Integer): Integer; overload; override;
+    function GetBytes(Chars: PUnicodeChar; CharCount: Integer; Bytes: PByte; ByteCount: Integer): Integer; overload; override;
+    function GetCharCount(Bytes: PByte; ByteCount: Integer): Integer; overload; override;
+    function GetChars(Bytes: PByte; ByteCount: Integer; Chars: PUnicodeChar; CharCount: Integer): Integer; overload; override;
+    function GetCodePage: Cardinal; override;
+    function GetEncodingName: UnicodeString; override;
+  public
+    constructor Create; virtual;
+    function Clone: TEncoding; override;
+    function GetMaxByteCount(CharCount: Integer): Integer; override;
+    function GetMaxCharCount(ByteCount: Integer): Integer; override;
+    function GetPreamble: TBytes; override;
+  end;
+
+  { TBigEndianUnicodeEncoding }
+
+  TBigEndianUnicodeEncoding = class(TUnicodeEncoding)
+  strict protected
+    function GetBytes(Chars: PUnicodeChar; CharCount: Integer; Bytes: PByte; ByteCount: Integer): Integer; overload; override;
+    function GetChars(Bytes: PByte; ByteCount: Integer; Chars: PUnicodeChar; CharCount: Integer): Integer; overload; override;
+    function GetCodePage: Cardinal; override;
+    function GetEncodingName: UnicodeString; override;
+  public
+    function Clone: TEncoding; override;
+    function GetPreamble: TBytes; override;
+  end;
+{$endif VER2_4}

+ 2 - 0
rtl/objpas/sysutils/sysutilh.inc

@@ -268,6 +268,7 @@ Type
 
   { MCBS functions }
   {$i sysansih.inc}
+  {$i syscodepagesh.inc}
 
   { wide string functions }
   {$i syswideh.inc}
@@ -275,6 +276,7 @@ Type
 {$ifdef FPC_HAS_UNICODESTRING}
   { unicode string functions }
   {$i sysunih.inc}
+  {$i sysencodingh.inc}
 {$endif FPC_HAS_UNICODESTRING}
 
   { Read filename handling functions declaration }

+ 2 - 0
rtl/objpas/sysutils/sysutils.inc

@@ -129,6 +129,7 @@
 
   { MCBS functions }
   {$i sysansi.inc}
+  {$i syscodepages.inc}
 
   { wide string functions }
   {$i syswide.inc}
@@ -136,6 +137,7 @@
 {$ifdef FPC_HAS_UNICODESTRING}
   { unicode string functions }
   {$i sysuni.inc}
+  {$i sysencoding.inc}
 {$endif FPC_HAS_UNICODESTRING}
   
   { threading stuff }