12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782 |
- {
- $Id$
- This file is part of the Free Pascal run time library.
- Copyright (c) 1999-2001 by Florian Klaempfl,
- member of the Free Pascal development team.
- This file implements support routines for WideStrings with FPC
- See the file COPYING.FPC, included in this distribution,
- for details about the copyright.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- **********************************************************************}
{
  This file contains the implementation of the WideString type,
  and all things that are needed for it.

  WideString is defined as a 'silent' pwidechar :
  a pwidechar that points to :

  @-12 : Longint for maximum size;
  @-8  : Longint for size;
  @-4  : Longint for reference count;
  @    : String + Terminating #0;

  Pwidechar(Widestring) is a valid typecast.
  So WS[i] is converted to the address @WS+(i-1)*sizeof(WideChar).

  Constants should be assigned a reference count of -1,
  meaning that they can't be disposed of.
}
Type
  { Header that precedes the character data of every heap WideString.
    The field order defines the memory layout and must not change. }
  PWideRec = ^TWideRec;
  TWideRec = Packed Record
    Maxlen : Longint;   { capacity in characters }
    len    : Longint;   { current length in characters }
    ref    : Longint;   { reference count, negative for constants }
    First  : WideChar;  { first character of the string data }
  end;

Const
  { Size of the header including the first character slot }
  WideRecLen   = SizeOf(TWideRec);
  { Distance from the start of the header to the first character }
  WideFirstOff = SizeOf(TWideRec)-SizeOf(WideChar);
{
  The default WideChar <-> Char conversion only converts the
  lower 128 chars (codes 0..127); all others are translated to spaces.
  These routines can be overridden for the current locale.
}
procedure Wide2AnsiMove(source:pwidechar;dest:pchar;len:longint);
{
  Default wide -> single byte conversion.
  Copies len characters from source to dest; every character with a
  code of 128 or above is written as a space.
  Nothing is written when len is zero or negative.
}
var
  remaining : longint;
  code      : word;
begin
  remaining:=len;
  while remaining>0 do
    begin
      code:=word(source^);
      if code>=128 then
        dest^:=' '
      else
        dest^:=char(code);
      inc(source);
      inc(dest);
      dec(remaining);
    end;
end;
procedure Ansi2WideMove(source:pchar;dest:pwidechar;len:longint);
{
  Default single byte -> wide conversion.
  Copies len characters from source to dest; every character with a
  code of 128 or above is written as a space.
  Nothing is written when len is zero or negative.
}
var
  remaining : longint;
  code      : byte;
begin
  remaining:=len;
  while remaining>0 do
    begin
      code:=byte(source^);
      if code>=128 then
        dest^:=' '
      else
        dest^:=widechar(code);
      inc(source);
      inc(dest);
      dec(remaining);
    end;
end;
Type
  { Signatures of the replaceable character conversion routines }
  TWide2AnsiMove = procedure(source:pwidechar;dest:pchar;len:longint);
  TAnsi2WideMove = procedure(source:pchar;dest:pwidechar;len:longint);

Const
  { Conversion hooks used by the string helpers below; they start out
    pointing at the default 7 bit routines. }
  Wide2AnsiMoveProc : TWide2AnsiMove = @Wide2AnsiMove;
  Ansi2WideMoveProc : TAnsi2WideMove = @Ansi2WideMove;
- (*
- Procedure UniqueWideString(Var S : WideString); [Public,Alias : 'FPC_WIDESTR_UNIQUE'];
- {
- Make sure reference count of S is 1,
- using copy-on-write semantics.
- }
- begin
- end;
- *)
- {****************************************************************************
- Internal functions, not in interface.
- ****************************************************************************}
{$ifdef WideStrDebug}
Procedure DumpWideRec(S : Pointer);
{
  Debug helper: prints the header fields (maximum length, length and
  reference count) of the WideString S points to, or a notice when S is nil.
}
Var
  Hdr : PWideRec;
begin
  If S<>Nil then
    begin
      Hdr:=PWideRec(S-WideFirstOff);
      Write ('(Maxlen: ',Hdr^.maxlen);
      Write (' Len:',Hdr^.len);
      Writeln (' Ref: ',Hdr^.ref,')');
    end
  else
    Writeln ('String is nil');
end;
{$endif}
Function NewWideString(Len : Longint) : Pointer;
{
  Allocates a WideString with room for Len characters on the heap.
  The new string has length zero and a reference count of 1.
  Returns a pointer to the first character, or nil when GetMem
  delivered nil.
}
Var
  Block : Pointer;
  Hdr   : PWideRec;
begin
  { WideRecLen already contains one character slot, which holds the
    terminating zero }
  GetMem(Block,WideRecLen+Len*SizeOf(WideChar));
  If Block=Nil then
    begin
      NewWideString:=Nil;
      exit;
    end;
  Hdr:=PWideRec(Block);
  Hdr^.Maxlen:=Len;   { Maximal length }
  Hdr^.Len:=0;        { Initial length }
  Hdr^.Ref:=1;        { Set reference count }
  Hdr^.First:=#0;     { Terminating #0 }
  { Hand out the address of the character data, not of the header }
  NewWideString:=Block+WideFirstOff;
end;
Procedure DisposeWideString(Var S : Pointer);
{
  Deallocates a WideString from the heap and sets S to nil.
  S points to the first character of the string; nil is accepted and
  ignored. The reference count is not inspected here.
}
begin
  If S=Nil then
    exit;
  { Step back to the start of the header. Plain pointer arithmetic is used
    instead of a Longint typecast so the address is never truncated on
    targets where a pointer is wider than a Longint. }
  S:=S-WideFirstOff;
  FreeMem (S);
  S:=Nil;
end;
Procedure WideStr_Decr_Ref (Var S : Pointer);[Public,Alias:'FPC_WIDESTR_DECR_REF'];
{
  Drops one reference to the WideString S.
  Nil strings and constant strings (negative reference count) are left
  untouched. Otherwise the count is decremented, the string is freed when
  the count reaches zero, and S is set to nil in either case.
}
Var
  Hdr : PWideRec;
Begin
  { Zero string }
  If S=Nil then
    exit;
  Hdr:=PWideRec(S-WideFirstOff);
  { Constant strings are never released }
  If Hdr^.Ref>=0 then
    begin
      { declocked does a MT safe dec and returns true, if the counter is 0 }
      If declocked(Hdr^.Ref) then
        DisposeWideString (S);
      { the caller's reference is gone, so clear the pointer }
      S:=nil;
    end;
end;
Procedure WideStr_Incr_Ref (Var S : Pointer);[Public,Alias:'FPC_WIDESTR_INCR_REF'];
{
  Adds one reference to the WideString S.
  Nil strings and constant strings (negative reference count) are skipped.
}
Begin
  If S<>Nil then
    { Let's be paranoid : Constant string ?? }
    If PWideRec(S-WideFirstOff)^.Ref>=0 then
      inclocked(PWideRec(S-WideFirstOff)^.Ref);
end;
Procedure WideStr_To_ShortStr (Var S1 : ShortString;S2 : Pointer);[Public, alias: 'FPC_WIDESTR_TO_SHORTSTR'];
{
  Converts the WideString S2 to the ShortString S1.
  A nil S2 yields the empty string. Input longer than S1 can hold is
  truncated to high(S1) characters. The characters are converted through
  Wide2AnsiMoveProc.
}
Var
  Size : Longint;
begin
  if S2=nil then
    S1:=''
  else
    begin
      { Read the length from the WideString header; the AnsiString record
        must not be used here, the two layouts are unrelated types }
      Size:=PWideRec(S2-WideFirstOff)^.Len;
      If Size>high(S1) then
        Size:=high(S1);
      Wide2AnsiMoveProc(PWideChar(S2),PChar(@S1[1]),Size);
      { Store the length byte of the short string }
      byte(S1[0]):=Size;
    end;
end;
Procedure ShortStr_To_WideStr (Var S1 : Pointer; Const S2 : ShortString);[Public, alias: 'FPC_SHORTSTR_TO_WIDESTR'];
{
  Converts the ShortString S2 to the WideString S1.
  S1 is resized to the length of S2 and filled through Ansi2WideMoveProc.
}
Var
  Count : Longint;
begin
  Count:=Length(S2);
  Setlength (WideString(S1),Count);
  { Nothing to convert for an empty source }
  if Count<=0 then
    exit;
  Ansi2WideMoveProc(PChar(@S2[1]),PWideChar(S1),Count);
end;
Procedure WideStr_To_AnsiStr (Var S1 : Pointer;S2 : Pointer);[Public, alias: 'FPC_WIDESTR_TO_ANSISTR'];
{
  Converts the WideString S2 to the AnsiString S1.
  A nil S2 sets S1 to nil; otherwise S1 is resized and filled through
  Wide2AnsiMoveProc.
  NOTE(review): in the nil case S1 is overwritten without releasing its
  previous contents - confirm callers always pass an empty S1.
}
Var
  Count : Longint;
begin
  if s2=nil then
    begin
      s1:=nil;
      exit;
    end;
  Count:=Length(WideString(S2));
  Setlength (AnsiString(S1),Count);
  if Count<=0 then
    exit;
  Wide2AnsiMoveProc(PWideChar(S2),PChar(S1),Count);
  { Terminating Zero }
  PChar(S1+Count)^:=#0;
end;
Procedure AnsiStr_To_WideStr (Var S1 : Pointer; Const S2 : Pointer);[Public, alias: 'FPC_ANSISTR_TO_WIDESTR'];
{
  Converts the AnsiString S2 to the WideString S1.
  A nil S2 sets S1 to nil; otherwise S1 is resized and filled through
  Ansi2WideMoveProc.
  NOTE(review): in the nil case S1 is overwritten without releasing its
  previous contents - confirm callers always pass an empty S1.
}
Var
  Count : Longint;
begin
  if s2=nil then
    begin
      s1:=nil;
      exit;
    end;
  Count:=Length(AnsiString(S2));
  Setlength (WideString(S1),Count);
  if Count<=0 then
    exit;
  Ansi2WideMoveProc(PChar(S2),PWideChar(S1),Count);
  { Terminating Zero }
  PWideChar(S1+Count*sizeof(WideChar))^:=#0;
end;
{ checked against the ansistring routine, 2001-05-27 (FK) }
Procedure WideStr_Assign (Var S1 : Pointer;S2 : Pointer);[Public,Alias:'FPC_WIDESTR_ASSIGN'];
{
  Assigns S2 to S1 (S1:=S2), taking in account reference counts.
  S2 gains a reference first (unless it is nil or a constant), then the
  old value of S1 is released, so assigning a string to itself is safe.
}
begin
  If S2<>nil then
    If PWideRec(S2-WideFirstOff)^.Ref>0 then
      { Use the same locked increment as WideStr_Incr_Ref so the count stays
        consistent with the locked decrement in WideStr_Decr_Ref }
      inclocked(PWideRec(S2-WideFirstOff)^.ref);
  { Decrease the reference count on the old S1 }
  widestr_decr_ref (S1);
  { And finally, have S1 pointing to S2 }
  S1:=S2;
end;
{ checked against the ansistring routine, 2001-05-27 (FK) }
Procedure WideStr_Concat (S1,S2 : Pointer;var S3 : Pointer);[Public, alias: 'FPC_WIDESTR_CONCAT'];
{
  Concatenates 2 WideStrings : S1+S2.
  Result Goes to S3;
  When one operand is nil the other one is simply assigned to S3.
  NOTE(review): S3 is released before S1 and S2 are read - confirm callers
  never pass an S3 that holds the only reference to S1 or S2.
}
Var
  LeftLen,RightLen : Longint;
begin
  { drop whatever the result variable held before }
  if S3<>nil then
    WideStr_Decr_Ref(S3);
  { only assign if s1 or s2 is empty }
  if S1=Nil then
    begin
      WideStr_Assign(S3,S2);
      exit;
    end;
  if S2=Nil then
    begin
      WideStr_Assign(S3,S1);
      exit;
    end;
  RightLen:=PWideRec(S2-WideFirstOff)^.Len;
  LeftLen:=Length(WideString(S1));
  SetLength (WideString(S3),RightLen+LeftLen);
  Move (S1^,S3^,LeftLen*sizeof(WideChar));
  { the +1 also copies the terminating zero of S2 }
  Move (S2^,(S3+LeftLen*sizeof(WideChar))^,(RightLen+1)*sizeof(WideChar));
end;
Procedure Char_To_WideStr(var S1 : Pointer; c : Char);[Public, alias: 'FPC_CHAR_TO_WIDESTR'];
{
  Converts the single character c to a WideString of length 1 in S1.
}
begin
  Setlength (WideString(S1),1);
  PWideChar(S1)[0]:=c;
  { Terminating Zero }
  PWideChar(S1)[1]:=#0;
end;
Procedure PChar_To_WideStr(var a : widestring;p : pchar);[Public,Alias : 'FPC_PCHAR_TO_WIDESTR'];
{
  Converts the zero terminated string p to the WideString a.
  The previous contents of a are released first. A nil or empty p
  leaves a empty (nil).
}
Var
  Count : Longint;
begin
  { release the old value; a is nil from here on }
  if pointer(a)<>nil then
    WideStr_Decr_Ref(Pointer(a));
  pointer(a):=nil;
  if not assigned(p) then
    exit;
  if p[0]=#0 then
    exit;
  { a length of -1 makes IndexChar search without an upper bound }
  Count:=IndexChar(p^,-1,#0);
  Pointer(a):=NewWidestring(Count);
  SetLength(a,Count);
  Ansi2WideMoveProc(p,PWideChar(a),Count);
end;
Procedure CharArray_To_WideStr(var a : widestring;p : pchar;l:longint);[Public,Alias : 'FPC_CHARARRAY_TO_WIDESTR'];
{
  Converts the character array of l elements starting at p to the
  WideString a. The text ends at the first #0 in the array, or at the end
  of the array when it contains no #0.
  NOTE(review): unlike PChar_To_WideStr the previous value of a is not
  released here - confirm callers always pass an empty a.
}
var
  i : longint;
begin
  { an empty array has no p[0] to look at }
  if (l=0) or (p[0]=#0) Then
    Pointer(a):=nil
  else
    begin
      i:=IndexChar(p^,L,#0);
      { IndexChar returns -1 when no #0 was found: the array is completely
        filled, so all L characters belong to the string }
      if i=-1 then
        i:=L;
      Pointer(a):=NewWidestring(i);
      SetLength(a,i);
      Ansi2WideMoveProc(P,PWideChar(A),i);
    end;
end;
Function WideStr_Compare(S1,S2 : Pointer): Longint;[Public,Alias : 'FPC_WIDESTR_COMPARE'];
{
  Compares 2 WideStrings;
  The result is
   <0 if S1<S2
    0 if S1=S2
   >0 if S1>S2
  The common prefix is compared with CompareWord; when it is equal the
  difference of the lengths decides.
}
Var
  Len1,Len2,Common,Outcome : Longint;
begin
  { identical pointers (including two nil strings) are equal }
  if S1=S2 then
    begin
      WideStr_Compare:=0;
      exit;
    end;
  Len1:=Length(WideString(S1));
  Len2:=Length(WideString(S2));
  if Len1<Len2 then
    Common:=Len1
  else
    Common:=Len2;
  Outcome:=CompareWord(S1^,S2^,Common);
  if Outcome=0 then
    Outcome:=Len1-Len2;
  WideStr_Compare:=Outcome;
end;
Procedure WideStr_CheckZero(p : pointer);[Public,Alias : 'FPC_WIDESTR_CHECKZERO'];
{
  Raises run time error 201 through HandleErrorFrame when p is nil.
}
begin
  if p<>nil then
    exit;
  HandleErrorFrame(201,get_frame);
end;
Procedure WideStr_CheckRange(len,index : longint);[Public,Alias : 'FPC_WIDESTR_RANGECHECK'];
{
  Raises run time error 201 through HandleErrorFrame unless index lies
  in the range 1..len.
}
begin
  if (Index>=1) and (index<=len) then
    exit;
  HandleErrorFrame(201,get_frame);
end;
{$ifndef INTERNSETLENGTH}
Procedure SetLength (Var S : WideString; l : Longint);
{$else INTERNSETLENGTH}
Procedure WideStr_SetLength (Var S : WideString; l : Longint);[Public,Alias : 'FPC_WIDESTR_SETLENGTH'];
{$endif INTERNSETLENGTH}
{
  Sets The length of string S to L.
  Makes sure S is unique, and contains enough room.
  A length of zero or less releases the string and leaves S nil.
  When the string has to be reallocated, the characters that fit into the
  new length are preserved; anything beyond them is undefined.
}
Var
  Temp    : Pointer;
  CopyLen : Longint;
begin
  if (l>0) then
    begin
      if Pointer(S)=nil then
        begin
          { Need a complete new string...}
          Pointer(s):=NewWideString(l);
        end
      else
        If (PWideRec(Pointer(S)-WideFirstOff)^.Maxlen < L) or
           (PWideRec(Pointer(S)-WideFirstOff)^.Ref <> 1) then
          begin
            { Reallocation is needed... }
            Temp:=Pointer(NewWideString(L));
            { Copy only what the old string really holds; copying L
              characters would read past the end of the old buffer when
              the string grows }
            CopyLen:=Length(S);
            if CopyLen>L then
              CopyLen:=L;
            if CopyLen>0 then
              Move(Pointer(S)^,Temp^,CopyLen*sizeof(WideChar));
            WideStr_decr_ref(Pointer(S));
            Pointer(S):=Temp;
          end;
      { Force nil termination in case it gets shorter }
      PWideChar(Pointer(S)+l*sizeof(WideChar))^:=#0;
      PWideRec(Pointer(S)-WideFirstOff)^.Len:=l;
    end
  else
    begin
      { Length=0 }
      if Pointer(S)<>nil then
        WideStr_decr_ref (Pointer(S));
      Pointer(S):=Nil;
    end;
end;
- {*****************************************************************************
- Public functions, In interface.
- *****************************************************************************}
{$ifndef INTERNLENGTH}
Function Length (Const S : WideString) : Longint;
{
  Returns the length of a WideString in characters.
  Empty strings are represented by nil and have length 0.
}
begin
  If Pointer(S)<>Nil then
    Length:=PWideRec(Pointer(S)-WideFirstOff)^.Len
  else
    Length:=0;
end;
{$endif INTERNLENGTH}
Procedure UniqueString(Var S : WideString); [Public,Alias : 'FPC_WIDESTR_UNIQUE'];
{
  Makes sure S has a reference count of exactly 1.
  When it has not, the characters are copied into a freshly allocated
  string and the reference to the old one is dropped.
}
Var
  Fresh : Pointer;
  Count : Longint;
begin
  If Pointer(S)=Nil then
    exit;
  { already the sole owner }
  if PWideRec(Pointer(S)-WideFirstOff)^.Ref=1 then
    exit;
  Count:=PWideRec(Pointer(S)-WideFirstOff)^.len;
  Fresh:=NewWideString (Count);
  { the +1 takes the terminating zero along }
  Move (PWideChar(S)^,Fresh^,(Count+1)*sizeof(WideChar));
  PWideRec(Fresh-WideFirstOff)^.len:=Count;
  widestr_decr_ref (Pointer(S));  { Thread safe }
  Pointer(S):=Fresh;
end;
Function Copy (Const S : WideString; Index,Size : Longint) : WideString;
{
  Returns up to Size characters of S, starting at the 1 based position
  Index. An Index below 1 is treated as 1. The result is empty when Index
  lies behind the end of S or when Size is zero or negative; Size is
  clamped to the characters available from Index on.
}
var
  ResultAddress : Pointer;
  Avail         : Longint;
begin
  ResultAddress:=Nil;
  dec(index);
  if Index < 0 then
    Index := 0;
  { Clamp Size against the characters left after Index. The remaining count
    is computed by subtraction, because Index+Size can overflow when either
    of them is close to maxint and would then slip past the check. }
  Avail:=Length(S)-Index;
  if Size>Avail then
    Size:=Avail;
  If Size>0 then
    begin
      ResultAddress:=Pointer(NewWideString (Size));
      if ResultAddress<>Nil then
        begin
          Move (PWideChar(S)[Index],ResultAddress^,Size*sizeof(WideChar));
          PWideRec(ResultAddress-WideFirstOff)^.Len:=Size;
          PWideChar(ResultAddress+Size*sizeof(WideChar))^:=#0;
        end;
    end;
  Pointer(Copy):=ResultAddress;
end;
Function Pos (Const Substr : WideString; Const Source : WideString) : Longint;
{
  Returns the 1 based position of the first occurrence of Substr in
  Source, or 0 when Substr is empty or does not occur.
}
var
  Idx,LastStart : StrLenInt;
  SubLen        : Longint;
  Cur           : pwidechar;
begin
  Pos:=0;
  SubLen:=Length(SubStr);
  if SubLen<=0 then
    exit;
  { LastStart+1 is the last position where Substr could still fit }
  LastStart:=Length(source)-SubLen;
  Cur:=@source[1];
  Idx:=0;
  while Idx<=LastStart do
    begin
      inc(Idx);
      { cheap first character test before the full comparison }
      if SubStr[1]=Cur^ then
        if CompareWord(Substr[1],Cur^,SubLen)=0 then
          begin
            Pos:=Idx;
            exit;
          end;
      inc(Cur);
    end;
end;
{ Faster version for a widechar alone }
Function Pos (c : WideChar; Const s : WideString) : Longint;
{
  Returns the 1 based position of the first occurrence of c in s,
  or 0 when c does not occur.
}
var
  idx,count : longint;
  cur       : pwidechar;
begin
  pos:=0;
  cur:=@s[1];
  count:=length(s);
  idx:=1;
  while idx<=count do
    begin
      if cur^=c then
        begin
          pos:=idx;
          exit;
        end;
      inc(cur);
      inc(idx);
    end;
end;
{ Faster version for a char alone. Must be implemented because   }
{ pos(c: char; const s: shortstring) also exists, so otherwise   }
{ using pos(char,pchar) will always call the shortstring version }
{ (exact match for first argument), also with $h+ (JM)           }
Function Pos (c : Char; Const s : WideString) : Longint;
{
  Returns the 1 based position of the first occurrence of c in s,
  or 0 when c does not occur. c is widened once before the search.
}
var
  idx,count : longint;
  wanted    : widechar;
  cur       : pwidechar;
begin
  pos:=0;
  wanted:=c;
  cur:=@s[1];
  count:=length(s);
  idx:=1;
  while idx<=count do
    begin
      if cur^=wanted then
        begin
          pos:=idx;
          exit;
        end;
      inc(cur);
      inc(idx);
    end;
end;
Procedure Delete (Var S : WideString; Index,Size: Longint);
{
  Removes Size characters from S, starting at the 1 based position Index.
  An Index below 1 is moved to 1 and Size is shortened by the skipped
  amount. Nothing happens when S is empty, Index lies behind the end of S
  or Size is not positive. Size is clamped to the end of the string.
}
Var
  LS : Longint;
begin
  If Length(S)=0 then
    exit;
  if index<=0 then
    begin
      inc(Size,index-1);
      index:=1;
    end;
  LS:=PWideRec(Pointer(S)-WideFirstOff)^.Len;
  if (Index<=LS) and (Size>0) then
    begin
      UniqueString (S);
      { Clamp by subtraction: Size+Index overflows for Size=maxint, which
        is the usual way to ask for "delete up to the end" }
      if Size>LS-Index+1 then
        Size:=LS-Index+1;
      if Size<=LS-Index then
        begin
          Dec(Index);
          { Move the tail behind the deleted range plus the terminating
            zero, and not more, so nothing is read past the buffer }
          Move(PWideChar(S)[Index+Size],PWideChar(S)[Index],(LS-Index-Size+1)*sizeof(WideChar));
        end;
      Setlength(s,LS-Size);
    end;
end;
Procedure Insert (Const Source : WideString; Var S : WideString; Index : Longint);
{
  Inserts Source into S in front of the 1 based position Index.
  Index is clamped to the range 1..Length(S)+1. An empty Source leaves S
  unchanged. The result is built in a new string which then replaces S.
}
var
  Merged               : WideString;
  SrcLen,DstLen,Tail   : Longint;
begin
  SrcLen:=Length(Source);
  If SrcLen=0 then
    exit;
  if index <= 0 then
    index := 1;
  DstLen:=Length(S);
  if index > DstLen then
    index := DstLen+1;
  { continue with a 0 based offset }
  Dec(Index);
  Pointer(Merged) := NewWideString(SrcLen+DstLen);
  SetLength(Merged,SrcLen+DstLen);
  { head of S }
  If Index>0 then
    move (PWideChar(S)^,PWideChar(Merged)^,Index*sizeof(WideChar));
  { inserted text }
  Move (PWideChar(Source)^,PWideChar(Merged)[Index],SrcLen*sizeof(WideChar));
  { tail of S }
  Tail:=DstLen-Index;
  If Tail>0 then
    Move(PWideChar(S)[Index],PWideChar(Merged)[SrcLen+Index],Tail*sizeof(WideChar));
  S:=Merged;
end;
- {!!!:Procedure SetString (Var S : WideString; Buf : PWideChar; Len : Longint);
- begin
- SetLength(S,Len);
- Move (Buf[0],S[1],Len*2);
- end;}
Function ValWideFloat(Const S : WideString; Var Code : ValSInt): ValReal; [public, alias:'FPC_VAL_REAL_ANSISTR'];
{
  Converts the WideString S to a floating point value by converting it to
  a ShortString and handing that to ValFloat, which also sets Code.
  Input longer than a ShortString can hold is truncated by the conversion.
  NOTE(review): the public alias ends in _ANSISTR although this is the
  WideString variant - confirm it does not clash with the AnsiString helper.
}
Var
  { declared as ShortString explicitly: WideStr_To_ShortStr takes a
    ShortString var parameter, whatever the meaning of plain String is }
  SS : ShortString;
begin
  WideStr_To_ShortStr(SS,Pointer(S));
  ValWideFloat := ValFloat(SS,Code);
end;
Function ValWideUnsignedInt (Const S : WideString; Var Code : ValSInt): ValUInt; [public, alias:'FPC_VAL_UINT_ANSISTR'];
{
  Converts the WideString S to an unsigned integer by converting it to a
  ShortString and handing that to ValUnsignedInt, which also sets Code.
  Strings longer than 255 characters are rejected with Code=256 and a
  result of 0, exactly as the other integer Val helpers in this file do,
  instead of being silently truncated and parsed.
  NOTE(review): the public alias ends in _ANSISTR although this is the
  WideString variant - confirm it does not clash with the AnsiString helper.
}
Var
  SS : ShortString;
begin
  ValWideUnsignedInt:=0;
  if length(S)>255 then
    code:=256
  else
    begin
      WideStr_To_ShortStr(SS,Pointer(S));
      ValWideUnsignedInt := ValUnsignedInt(SS,Code);
    end;
end;
Function ValWideSignedInt (DestSize: longint; Const S : WideString; Var Code : ValSInt): ValSInt; [public, alias:'FPC_VAL_SINT_ANSISTR'];
{
  Converts the WideString S to a signed integer through ValSignedInt,
  which also sets Code. Strings longer than 255 characters are rejected
  with Code=256 and a result of 0.
}
Var
  Buf : ShortString;
begin
  ValWideSignedInt:=0;
  if length(S)<=255 then
    begin
      WideStr_To_ShortStr (Buf,Pointer(S));
      ValWideSignedInt := ValSignedInt(DestSize,Buf,Code);
    end
  else
    code:=256;
end;
Function ValWideUnsignedint64 (Const S : WideString; Var Code : ValSInt): qword; [public, alias:'FPC_VAL_QWORD_ANSISTR'];
{
  Converts the WideString S to a qword through ValQWord, which also sets
  Code. Strings longer than 255 characters are rejected with Code=256 and
  a result of 0.
}
Var
  Buf : ShortString;
begin
  ValWideUnsignedInt64:=0;
  if length(S)<=255 then
    begin
      WideStr_To_ShortStr(Buf,Pointer(S));
      ValWideUnsignedInt64 := ValQWord(Buf,Code);
    end
  else
    code:=256;
end;
Function ValWideSignedInt64 (Const S : WideString; Var Code : ValSInt): Int64; [public, alias:'FPC_VAL_INT64_ANSISTR'];
{
  Converts the WideString S to an Int64 through valInt64, which also sets
  Code. Strings longer than 255 characters are rejected with Code=256 and
  a result of 0.
}
Var
  Buf : ShortString;
begin
  ValWideSignedInt64:=0;
  if length(S)<=255 then
    begin
      WideStr_To_ShortStr (Buf,Pointer(S));
      ValWideSignedInt64 := valInt64(Buf,Code);
    end
  else
    code:=256;
end;
procedure WideStr_Float(d : ValReal;len,fr,rt : longint;var s : WideString);[public,alias:'FPC_WIDESTR_FLOAT'];
{
  Formats the floating point value d into s.
  The text is produced by str_real in a ShortString buffer, with rt
  selecting the real type, and then assigned to the WideString.
}
var
  buf : shortstring;
begin
  str_real(len,fr,d,treal_type(rt),buf);
  s:=buf;
end;
Procedure WideStr_Cardinal(C : Cardinal;Len : Longint; Var S : WideString);[Public,Alias : 'FPC_WIDESTR_CARDINAL'];
{
  Formats the cardinal C into S.
  The text is produced by int_str_cardinal in a ShortString buffer and
  then assigned to the WideString.
}
Var
  Buf : ShortString;
begin
  int_str_cardinal(C,Len,Buf);
  S:=Buf;
end;
Procedure WideStr_Longint(L : Longint; Len : Longint; Var S : WideString);[Public,Alias : 'FPC_WIDESTR_LONGINT'];
{
  Formats the longint L into S.
  The text is produced by int_Str_Longint in a ShortString buffer and
  then assigned to the WideString.
}
Var
  Buf : ShortString;
begin
  int_Str_Longint (L,Len,Buf);
  S:=Buf;
end;
- {
- $Log$
- Revision 1.9 2001-07-09 21:15:41 peter
- * Length made internal
- * Add array support for Length
- Revision 1.8 2001/07/08 21:00:18 peter
- * various widestring updates, it works now mostly without charset
- mapping supported
- Revision 1.7 2001/05/27 14:28:03 florian
- + some procedures added
- Revision 1.6 2000/11/06 23:17:15 peter
- * removed some warnings
- Revision 1.5 2000/11/06 20:34:24 peter
- * changed ver1_0 defines to temporary defs
- Revision 1.4 2000/10/21 18:20:17 florian
- * a lot of small changes:
- - setlength is internal
- - win32 graph unit extended
- ....
- Revision 1.3 2000/08/08 22:12:36 sg
- * Implemented WideString helper functions (but they are not tested yet
- due to the lack of full compiler support for WideString/WideChar!)
- Revision 1.2 2000/07/13 11:33:46 michael
- + removed logs
- }
|