12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338 |
- {
- $Id$
- This file is part of the Free Pascal run time library.
- Copyright (c) 1999-2001 by Florian Klaempfl,
- member of the Free Pascal development team.
- This file implements support routines for WideStrings/Unicode with FPC
- See the file COPYING.FPC, included in this distribution,
- for details about the copyright.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- **********************************************************************}
- {
- This file contains the implementation of the WideString type,
- and all things that are needed for it.
- WideString is defined as a 'silent' pwidechar :
- a pwidechar that points to :
- @-2*SizeOf(SizeInt) : SizeInt for reference count;
- @-SizeOf(SizeInt) : SizeInt for length (in WideChars);
- @ : String + Terminating #0;
- Pwidechar(Widestring) is a valid typecast.
- So WS[i] is converted to the address @WS+(i-1)*SizeOf(WideChar).
- Constants should be assigned a reference count of -1,
- meaning that they can't be disposed of.
- }
- Type
- PWideRec = ^TWideRec; { pointer to the header that precedes the character data }
- TWideRec = Packed Record { header of a heap-allocated WideString }
- Ref, { reference count; the ref-count helpers leave negative values (constants) untouched }
- Len : SizeInt; { current length in WideChars, not counting the terminating #0 }
- First : WideChar; { first character; a WideString pointer points at this field }
- end;
- Const
- WideRecLen = SizeOf(TWideRec); { header size, including room for one WideChar }
- WideFirstOff = SizeOf(TWideRec)-sizeof(WideChar); { byte distance from the header start to First }
- {
- Default WideChar <-> Char conversion only converts the
- lower 128 chars (#0..#127); all others are translated to spaces.
- These routines can be overridden for the current locale
- (see SetWideStringManager).
- }
- procedure Wide2AnsiMove(source:pwidechar;dest:pchar;len:SizeInt);
- { Default wide -> single-byte conversion: writes len characters to dest.
-   Code units below 128 are copied unchanged, anything else becomes a space.
-   Nothing is written when len<=0. }
- var
-   remaining : SizeInt;
-   code : word;
- begin
-   remaining:=len;
-   while remaining>0 do
-     begin
-       code:=word(source^);
-       if code>=128 then
-         dest^:=' '
-       else
-         dest^:=char(code);
-       inc(source);
-       inc(dest);
-       dec(remaining);
-     end;
- end;
- procedure Ansi2WideMove(source:pchar;dest:pwidechar;len:SizeInt);
- { Default single-byte -> wide conversion: writes len characters to dest.
-   Bytes below 128 are widened unchanged, anything else becomes a space.
-   Nothing is written when len<=0. }
- var
-   remaining : SizeInt;
-   code : byte;
- begin
-   remaining:=len;
-   while remaining>0 do
-     begin
-       code:=byte(source^);
-       if code>=128 then
-         dest^:=' '
-       else
-         dest^:=widechar(code);
-       inc(source);
-       inc(dest);
-       dec(remaining);
-     end;
- end;
- Const
- Wide2AnsiMoveProc:TWide2AnsiMove=@Wide2AnsiMove; { currently installed wide->ansi converter; replaced by SetWideStringManager }
- Ansi2WideMoveProc:TAnsi2WideMove=@Ansi2WideMove; { currently installed ansi->wide converter; replaced by SetWideStringManager }
- Procedure GetWideStringManager (Var Manager : TWideStringManager);
- { Copies the currently installed conversion routines into Manager. }
- begin
-   Manager.Ansi2WideMove:=Ansi2WideMoveProc;
-   Manager.Wide2AnsiMove:=Wide2AnsiMoveProc;
- end;
- Procedure SetWideStringManager (Const New : TWideStringManager; Var Old: TWideStringManager);
- { Saves the currently installed conversion routines in Old, then installs
-   the ones from New. }
- begin
-   { snapshot the active routines first }
-   Old.Wide2AnsiMove:=Wide2AnsiMoveProc;
-   Old.Ansi2WideMove:=Ansi2WideMoveProc;
-   { then install the replacement set }
-   SetWideStringManager(New);
- end;
- Procedure SetWideStringManager (Const New : TWideStringManager);
- { Installs the conversion routines held in New as the active ones. }
- begin
-   Ansi2WideMoveProc:=New.Ansi2WideMove;
-   Wide2AnsiMoveProc:=New.Wide2AnsiMove;
- end;
- (*
- Procedure UniqueWideString(Var S : WideString); [Public,Alias : 'FPC_WIDESTR_UNIQUE'];
- {
- Make sure reference count of S is 1,
- using copy-on-write semantics.
- }
- begin
- end;
- *)
- {****************************************************************************
- Internal functions, not in interface.
- ****************************************************************************}
- {$ifdef WideStrDebug}
- Procedure DumpWideRec(S : Pointer);
- {
-   Debug helper: prints the header (length and reference count) of the
-   WideString whose character data starts at S, or a notice when S is nil.
-   TWideRec has no maxlen field, so only Len and Ref are printed.
- }
- begin
-   If S=Nil then
-     Writeln ('String is nil')
-   Else
-     With PWideRec(S-WideFirstOff)^ do
-       begin
-         Write ('(Len:',len);
-         Writeln (' Ref: ',ref,')');
-       end;
- end;
- {$endif}
- Function NewWideString(Len : SizeInt) : Pointer;
- {
-   Allocates heap room for a WideString of Len characters plus header.
-   The header is set to length 0, reference count 1 and a #0 first
-   character. Returns a pointer to the character data, or nil when GetMem
-   returned nil.
- }
- Var
-   Block : Pointer;
- begin
-   GetMem(Block,WideRecLen+Len*sizeof(WideChar));
-   NewWideString:=Block;
-   If Block=Nil then
-     exit;
-   PWideRec(Block)^.Ref:=1;     { one owner }
-   PWideRec(Block)^.Len:=0;     { caller sets the real length }
-   PWideRec(Block)^.First:=#0;  { terminating #0 }
-   { hand out the address of the character data, not of the header }
-   NewWideString:=Block+WideFirstOff;
- end;
- Procedure DisposeWideString(Var S : Pointer);
- {
-   Releases the heap block of the WideString whose data starts at S and
-   sets S to nil. Does nothing for a nil S.
- }
- begin
-   If S<>Nil then
-     begin
-       { step back from the character data to the start of the header }
-       Dec (S,WideFirstOff);
-       FreeMem (S);
-       S:=Nil;
-     end;
- end;
- Procedure fpc_WideStr_Decr_Ref (Var S : Pointer);saveregisters;[Public,Alias:'FPC_WIDESTR_DECR_REF']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Drops one reference from a non-constant widestring and frees it when
-   the count reaches zero. Nil and constant (negative count) strings are
-   left untouched. Unless decrrefnotnil is defined, S is set to nil.
- }
- Type
-   pSizeInt = ^SizeInt;
- Var
-   RefCount : pSizeInt;
- Begin
-   If S<>Nil then
-     begin
-       RefCount:=@PWideRec(S-WideFirstOff)^.Ref;
-       If RefCount^>=0 then
-         begin
-           { declocked does a MT safe dec and returns true, if the counter is 0 }
-           If declocked(RefCount^) then
-             DisposeWideString (S);
- {$ifndef decrrefnotnil}
-           s:=nil;
- {$endif}
-         end;
-     end;
- end;
- {$ifdef hascompilerproc}
- { alias for internal use: binds this Pascal name to the routine exported as FPC_WIDESTR_DECR_REF }
- Procedure fpc_WideStr_Decr_Ref (Var S : Pointer);saveregisters;[external name 'FPC_WIDESTR_DECR_REF'];
- {$endif compilerproc}
- {$ifdef hascompilerproc}
- Procedure fpc_WideStr_Incr_Ref (S : Pointer);saveregisters;[Public,Alias:'FPC_WIDESTR_INCR_REF']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {$else}
- Procedure fpc_WideStr_Incr_Ref (Var S : Pointer);saveregisters;[Public,Alias:'FPC_WIDESTR_INCR_REF'];
- {$endif compilerproc}
- { Adds one reference to the widestring at S using inclocked. Nil strings
-   and constant strings (negative count) are left untouched. }
- Begin
-   If S<>Nil then
-     begin
-       If PWideRec(S-WideFirstOff)^.Ref>=0 then
-         inclocked(PWideRec(S-WideFirstOff)^.Ref);
-     end;
- end;
- {$ifdef hascompilerproc}
- { alias for internal use: binds this Pascal name to the routine exported as FPC_WIDESTR_INCR_REF }
- Procedure fpc_WideStr_Incr_Ref (S : Pointer);saveregisters;[external name 'FPC_WIDESTR_INCR_REF'];
- {$endif compilerproc}
- function fpc_WideStr_To_ShortStr (high_of_res: SizeInt;const S2 : WideString): shortstring;[Public, alias: 'FPC_WIDESTR_TO_SHORTSTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Converts a WideString to a ShortString through the installed
-   wide->ansi routine, truncating to at most high_of_res characters.
- }
- Var
-   Count : SizeInt;
- begin
-   if S2='' then
-     begin
-       fpc_WideStr_To_ShortStr:='';
-       exit;
-     end;
-   Count:=Length(S2);
-   If high_of_res<Count then
-     Count:=high_of_res;
-   Wide2AnsiMoveProc(PWideChar(S2),PChar(@fpc_WideStr_To_ShortStr[1]),Count);
-   { store the length byte directly }
-   byte(fpc_WideStr_To_ShortStr[0]):=byte(Count);
- end;
- Function fpc_ShortStr_To_WideStr (Const S2 : ShortString): WideString; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Converts a ShortString to a WideString through the installed
-   ansi->wide routine.
- }
- Var
-   Count : SizeInt;
- begin
-   Count:=Length(S2);
-   Setlength (fpc_ShortStr_To_WideStr,Count);
-   if Count<=0 then
-     exit;
-   Ansi2WideMoveProc(PChar(@S2[1]),PWideChar(Pointer(fpc_ShortStr_To_WideStr)),Count);
-   { Terminating Zero }
-   PWideChar(Pointer(fpc_ShortStr_To_WideStr)+Count*sizeof(WideChar))^:=#0;
- end;
- { old style helper: procedure form compiled only when hascompilerproc is not defined; stores the converted string's pointer in S1 }
- {$ifndef hascompilerproc}
- Procedure fpc_ShortStr_To_WideStr (Var S1 : Pointer; Const S2 : ShortString);[Public, alias: 'FPC_SHORTSTR_TO_WIDESTR'];
- begin
- s1 := pointer(fpc_ShortStr_To_WideStr(s2)); { NOTE(review): pointer is taken from a function result without touching the reference count - confirm ownership }
- end;
- {$endif hascompilerproc}
- Function fpc_WideStr_To_AnsiStr (const S2 : WideString): AnsiString; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Converts a WideString to an AnsiString through the installed
-   wide->ansi routine. An empty S2 yields an empty result.
- }
- Var
-   Size : SizeInt;
- begin
-   if s2='' then
-     begin
-       { assign explicitly: a managed function result is not guaranteed to
-         arrive empty }
-       fpc_WideStr_To_AnsiStr:='';
-       exit;
-     end;
-   Size:=Length(WideString(S2));
-   Setlength (fpc_WideStr_To_AnsiStr,Size);
-   if Size>0 then
-     begin
-       Wide2AnsiMoveProc(PWideChar(Pointer(S2)),PChar(Pointer(fpc_WideStr_To_AnsiStr)),Size);
-       { Terminating Zero }
-       PChar(Pointer(fpc_WideStr_To_AnsiStr)+Size)^:=#0;
-     end;
- end;
- { old style helper: procedure form compiled only when hascompilerproc is not defined; stores the converted string's pointer in S1 }
- {$ifndef hascompilerproc}
- Procedure fpc_WideStr_To_AnsiStr (Var S1 : Pointer;const S2 : WideString);[Public, alias: 'FPC_WIDESTR_TO_ANSISTR'];
- begin
- s1 := pointer(fpc_WideStr_To_AnsiStr(s2)); { NOTE(review): pointer is taken from a function result without touching the reference count - confirm ownership }
- end;
- {$endif hascompilerproc}
- Function fpc_AnsiStr_To_WideStr (Const S2 : AnsiString): WideString; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Converts an AnsiString to a WideString through the installed
-   ansi->wide routine. An empty S2 yields an empty result.
- }
- Var
-   Size : SizeInt;
- begin
-   if s2='' then
-     begin
-       { assign explicitly: a managed function result is not guaranteed to
-         arrive empty }
-       result:='';
-       exit;
-     end;
-   Size:=Length(S2);
-   Setlength (result,Size);
-   if Size>0 then
-     begin
-       Ansi2WideMoveProc(PChar(S2),PWideChar(Pointer(result)),Size);
-       { Terminating Zero }
-       PWideChar(Pointer(result)+Size*sizeof(WideChar))^:=#0;
-     end;
- end;
- { compilers with widestrings should have compiler procs }
- Function fpc_PWideChar_To_AnsiStr(const p : pwidechar): ansistring; compilerproc;
- { Converts the #0-terminated wide string at p to an AnsiString through the
-   installed wide->ansi routine. A nil p yields an empty result. }
- var
-   Size : SizeInt;
- begin
-   if p=nil then
-     begin
-       { assign explicitly: a managed function result is not guaranteed to
-         arrive empty }
-       result:='';
-       exit;
-     end;
-   { position of the terminating #0 = number of characters }
-   Size := IndexWord(p^, -1, 0);
-   Setlength (result,Size);
-   if Size>0 then
-     begin
-       Wide2AnsiMoveProc(P,PChar(Pointer(result)),Size);
-       { Terminating Zero }
-       PChar(Pointer(result)+Size)^:=#0;
-     end;
- end;
- Function fpc_PWideChar_To_WideStr(const p : pwidechar): widestring; compilerproc;
- { Copies the #0-terminated wide string at p into a new WideString.
-   A nil p yields an empty result. }
- var
-   Size : SizeInt;
- begin
-   if p=nil then
-     begin
-       { assign explicitly: a managed function result is not guaranteed to
-         arrive empty. The result is deliberately not cleared on the non-nil
-         path, because p may point into the string that receives the result. }
-       result:='';
-       exit;
-     end;
-   { position of the terminating #0 = number of characters }
-   Size := IndexWord(p^, -1, 0);
-   Setlength (result,Size);
-   if Size>0 then
-     begin
-       Move(p^,PWideChar(Pointer(result))^,Size*sizeof(WideChar));
-       { Terminating Zero }
-       PWideChar(Pointer(result)+Size*sizeof(WideChar))^:=#0;
-     end;
- end;
- Function fpc_PWideChar_To_ShortStr(const p : pwidechar): shortstring; compilerproc;
- { Converts the #0-terminated wide string at p to a ShortString through the
-   installed wide->ansi routine, truncating to 255 characters. A nil p, an
-   empty string, or a missing terminator (IndexWord returning -1) yields ''. }
- var
-   Size : SizeInt;
- begin
-   result:='';
-   if p=nil then
-     exit;
-   Size := IndexWord(p^, $7fffffff, 0);
-   { the result must stay '' here; presetting the length to Size+1 would
-     return a one-character string of garbage for an empty input }
-   if Size<=0 then
-     exit;
-   If Size>255 then
-     Size:=255;
-   Wide2AnsiMoveProc(p,PChar(@result[1]),Size);
-   byte(result[0]):=byte(Size);
- end;
- { old style helper: procedure form compiled only when hascompilerproc is not defined; stores the converted string's pointer in S1 }
- {$ifndef hascompilerproc}
- Procedure fpc_AnsiStr_To_WideStr (Var S1 : Pointer; Const S2 : AnsiString);[Public, alias: 'FPC_ANSISTR_TO_WIDESTR'];
- begin
- s1 := pointer(fpc_AnsiStr_To_WideStr(s2)); { NOTE(review): pointer is taken from a function result without touching the reference count - confirm ownership }
- end;
- {$endif hascompilerproc}
- { checked against the ansistring routine, 2001-05-27 (FK) }
- Procedure fpc_WideStr_Assign (Var S1 : Pointer;S2 : Pointer);[Public,Alias:'FPC_WIDESTR_ASSIGN']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Assigns S2 to S1 (S1:=S2), taking in account reference counts.
-   The new reference is taken before the old one is dropped, so that
-   assigning a string to itself cannot free it.
- }
- begin
-   If S2<>nil then
-     If PWideRec(S2-WideFirstOff)^.Ref>0 then
-       { use the locked increment, matching fpc_WideStr_Incr_Ref and the
-         declocked used by fpc_WideStr_Decr_Ref }
-       inclocked(PWideRec(S2-WideFirstOff)^.ref);
-   { Decrease the reference count on the old S1 }
-   fpc_widestr_decr_ref (S1);
-   { And finally, have S1 pointing to S2 }
-   S1:=S2;
- end;
- {$ifdef hascompilerproc}
- { alias for internal use: binds this Pascal name to the routine exported as FPC_WIDESTR_ASSIGN }
- Procedure fpc_WideStr_Assign (Var S1 : Pointer;S2 : Pointer);[external name 'FPC_WIDESTR_ASSIGN'];
- {$endif hascompilerproc}
- { checked against the ansistring routine, 2001-05-27 (FK) }
- {$ifdef hascompilerproc}
- function fpc_WideStr_Concat (const S1,S2 : WideString): WideString; compilerproc;
- var
- S3: WideString absolute result; { lets the shared body below write the function result as S3 }
- {$else hascompilerproc}
- Procedure fpc_WideStr_Concat (S1,S2 : WideString;var S3 : WideString);[Public, alias: 'FPC_WIDESTR_CONCAT'];
- {$endif hascompilerproc}
- {
- Concatenates 2 WideStrings : S1+S2.
- Result Goes to S3;
- When one operand is empty the other is assigned to S3 directly.
- Otherwise S3 is resized to the combined length and both operands
- are copied into it.
- }
- Var
- Size,Location : SizeInt; { Size = length of S2, Location = length of S1 }
- begin
- { only assign if s1 or s2 is empty }
- if (S1='') then
- S3 := S2
- else
- if (S2='') then
- S3 := S1
- else
- begin
- { create new result }
- Size:=Length(S2);
- Location:=Length(S1);
- SetLength (S3,Size+Location); { NOTE(review): in the function form S3 may be the same string as S1 or S2 - confirm the caller never passes an aliased result }
- Move (S1[1],S3[1],Location*sizeof(WideChar));
- Move (S2[1],S3[location+1],(Size+1)*sizeof(WideChar)); { Size+1 also copies the terminating #0 of S2 }
- end;
- end;
- Function fpc_Char_To_WideStr(const c : WideChar): WideString; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Builds a one-character WideString from c. For c=#0 the routine returns
-   without assigning the result.
- }
- begin
-   if c<>#0 then
-     begin
-       Setlength (fpc_Char_To_WideStr,1);
-       fpc_Char_To_WideStr[1]:=c;
-       { Terminating Zero }
-       PWideChar(Pointer(fpc_Char_To_WideStr)+sizeof(WideChar))^:=#0;
-     end;
-   { otherwise: result is automatically set to '' }
- end;
- { old style helper: procedure form compiled only when hascompilerproc is not defined; stores the converted string's pointer in S1 }
- {$ifndef hascompilerproc}
- Procedure fpc_Char_To_WideStr(var S1 : Pointer; c : WideChar);[Public, alias: 'FPC_CHAR_TO_WIDESTR'];
- begin
- s1 := pointer(fpc_Char_To_WideStr(c)); { NOTE(review): pointer is taken from a function result without touching the reference count - confirm ownership }
- end;
- {$endif hascompilerproc}
- Function fpc_PChar_To_WideStr(const p : pchar): WideString; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Converts the #0-terminated string at p to a WideString through the
-   installed ansi->wide routine. For a nil or empty p the routine returns
-   without assigning the result. }
- Var
-   Count : SizeInt;
- begin
-   if assigned(p) then
-     if p[0]<>#0 then
-       begin
-         { position of the terminating #0 = number of characters }
-         Count:=IndexChar(p^,-1,#0);
-         SetLength(fpc_PChar_To_WideStr,Count);
-         Ansi2WideMoveProc(P,PWideChar(Pointer(fpc_PChar_To_WideStr)),Count);
-       end;
-   { otherwise: result is automatically set to '' }
- end;
- { old style helper: procedure form compiled only when hascompilerproc is not defined; stores the converted string's pointer in a }
- {$ifndef hascompilerproc}
- Procedure fpc_PChar_To_WideStr(var a : WideString;p : pchar);[Public,Alias : 'FPC_PCHAR_TO_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- begin
- pointer(a) := pointer(fpc_PChar_To_WideStr(p)); { NOTE(review): pointer is taken from a function result without touching the reference count - confirm ownership }
- end;
- {$endif hascompilerproc}
- Function fpc_CharArray_To_WideStr(const arr: array of char): WideString; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Converts a char array to a WideString through the installed ansi->wide
-   routine, stopping at the first #0 or at the end of the array. When the
-   first element is #0 the routine returns without assigning the result. }
- var
-   Count : SizeInt;
- begin
-   if arr[0]<>#0 then
-     begin
-       Count:=IndexChar(arr,high(arr)+1,#0);
-       { no terminator inside the array: take every element }
-       if Count = -1 then
-         Count := high(arr)+1;
-       SetLength(fpc_CharArray_To_WideStr,Count);
-       Ansi2WideMoveProc (pchar(@arr),PWideChar(Pointer(fpc_CharArray_To_WideStr)),Count);
-     end;
-   { otherwise: result is automatically set to '' }
- end;
- { old style helper }
- {$ifndef hascompilerproc}
- Procedure fpc_CharArray_To_WideStr(var a : WideString; p: pointer; len: SizeInt); [Public,Alias : 'FPC_CHARARRAY_TO_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Procedure form compiled only when hascompilerproc is not defined.
-   Converts up to len chars at p (stopping at the first #0) into a newly
-   allocated WideString stored in a. a becomes nil when the first char is #0. }
- var
-   src: pchar;
-   i: SizeInt;
- begin
-   src := pchar(p);
-   if src[0]=#0 Then
-     begin
-       pointer(a) := nil;
-       exit;
-     end;
-   i:=IndexChar(src^,len,#0);
-   if i = -1 then
-     i := len;
-   pointer(a) := NewWideString(i);
-   if pointer(a)<>nil then
-     begin
-       Ansi2WideMoveProc (src,PWideChar(Pointer(a)),i);
-       { NewWideString leaves Len at 0 and writes no terminator after the
-         data, so both must be set here or the string reads as empty }
-       PWideRec(Pointer(a)-WideFirstOff)^.Len:=i;
-       PWideChar(Pointer(a)+i*sizeof(WideChar))^:=#0;
-     end;
- end;
- {$endif not hascompilerproc}
- {$ifdef hascompilerproc}
- { inside the compiler, the resulttype is modified to that of the actual }
- { chararray we're converting to (JM) }
- function fpc_widestr_to_chararray(arraysize: SizeInt; const src: WideString): fpc_big_chararray;[public,alias: 'FPC_WIDESTR_TO_CHARARRAY']; compilerproc;
- { Converts src into a char array of arraysize elements through the installed
-   wide->ansi routine; src is truncated to arraysize and the rest is zeroed. }
- var
-   CopyLen: SizeInt;
- begin
-   CopyLen := length(src);
-   if arraysize < CopyLen then
-     CopyLen := arraysize;
-   { make sure we don't dereference src if it can be nil (JM) }
-   if CopyLen > 0 then
-     wide2ansimoveproc(pwidechar(@src[1]),pchar(@fpc_widestr_to_chararray[0]),CopyLen);
-   { zero-fill whatever the string did not cover }
-   fillchar(fpc_widestr_to_chararray[CopyLen],arraysize-CopyLen,0);
- end;
- {$endif hascompilerproc}
- Function fpc_WideStr_Compare(const S1,S2 : WideString): SizeInt;[Public,Alias : 'FPC_WIDESTR_COMPARE']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Compares 2 WideStrings code unit by code unit.
-   The result is
-    <0 if S1<S2
-    0 if S1=S2
-    >0 if S1>S2
-   When the common prefix is equal, the length difference decides.
- }
- Var
-   Len1,Len2,Common,Outcome : SizeInt;
- begin
-   Outcome:=0;
-   { same pointer (including both nil) means equal without looking at data }
-   if pointer(S1)<>pointer(S2) then
-     begin
-       Len1:=Length(S1);
-       Len2:=Length(S2);
-       if Len1>Len2 then
-         Common:=Len2
-       else
-         Common:=Len1;
-       Outcome:=CompareWord(S1[1],S2[1],Common);
-       if Outcome=0 then
-         Outcome:=Len1-Len2;
-     end;
-   fpc_WideStr_Compare:=Outcome;
- end;
- Procedure fpc_WideStr_CheckZero(p : pointer);[Public,Alias : 'FPC_WIDESTR_CHECKZERO']; {$ifdef hascompilerproc} compilerproc; {$endif}
- begin
- if p=nil then { a nil string pointer is reported as error 201, passing the current frame }
- HandleErrorFrame(201,get_frame);
- end;
- Procedure fpc_WideStr_CheckRange(len,index : SizeInt);[Public,Alias : 'FPC_WIDESTR_RANGECHECK']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Reports error 201 unless index lies within 1..len. }
- begin
-   if not ((index>=1) and (index<=len)) then
-     HandleErrorFrame(201,get_frame);
- end;
- {$ifndef INTERNSETLENGTH}
- Procedure SetLength (Var S : WideString; l : SizeInt);
- {$else INTERNSETLENGTH}
- Procedure fpc_WideStr_SetLength (Var S : WideString; l : SizeInt);[Public,Alias : 'FPC_WIDESTR_SETLENGTH']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {$endif INTERNSETLENGTH}
- {
-   Sets The length of string S to L.
-   Makes sure S is unique, and contains enough room.
-   l<=0 releases the string and leaves S nil.
-   For l>0 there are three cases: a nil S gets a new block, a singly
-   referenced S is grown in place when its block is too small, and any
-   other S is copied into a new block and the old reference is dropped.
- }
- Var
-   Temp : Pointer;
-   movelen: SizeInt;
- begin
-   if (l>0) then
-     begin
-       if Pointer(S)=nil then
-         begin
-           { Need a complete new string...}
-           Pointer(s):=NewWideString(l);
-         end
-       else if (PWideRec(Pointer(S)-WideFirstOff)^.Ref = 1) then
-         begin
-           { sole owner: resize the existing block, only when it is too small }
-           Dec(Pointer(S),WideFirstOff);
-           if L*sizeof(WideChar)+WideRecLen>MemSize(Pointer(S)) then
-             reallocmem(pointer(S), L*sizeof(WideChar)+WideRecLen);
-           Inc(Pointer(S), WideFirstOff);
-         end
-       else
-         begin
-           { Reallocation is needed... }
-           Temp:=Pointer(NewWideString(L));
-           if Length(S)>0 then
-             begin
-               if l < succ(length(s)) then
-                 movelen := l
-               { also move terminating null }
-               else
-                 movelen := succ(length(s));
-               Move(Pointer(S)^,Temp^,movelen * Sizeof(WideChar));
-             end;
-           fpc_widestr_decr_ref(Pointer(S));
-           Pointer(S):=Temp;
-         end;
-       { Force nil termination in case it gets shorter }
-       PWord(Pointer(S)+l*sizeof(WideChar))^:=0;
-       { use the WideString header offset, not the ansistring FirstOff }
-       PWideRec(Pointer(S)-WideFirstOff)^.Len:=l;
-     end
-   else
-     begin
-       { Length=0 }
-       if Pointer(S)<>nil then
-         fpc_widestr_decr_ref (Pointer(S));
-       Pointer(S):=Nil;
-     end;
- end;
- {*****************************************************************************
- Public functions, In interface.
- *****************************************************************************}
- function WideCharToString(S : PWideChar) : AnsiString; { converts the wide string at S to an AnsiString }
- begin
- result:=WideCharLenToString(s,Length(WideString(s))); { length is taken from S cast to WideString - presumably via a temporary copy; TODO confirm }
- end;
- function StringToWideChar(const Src : AnsiString;Dest : PWideChar;DestSize : SizeInt) : PWideChar;
- { Converts Src into the buffer Dest (DestSize wide characters) through the
-   installed ansi->wide routine and returns Dest.
-   When Src is shorter than DestSize the output is #0-terminated. Otherwise
-   the first DestSize characters are converted and no terminator is written,
-   as before. }
- var
-   SrcLen : SizeInt;
- begin
-   SrcLen:=Length(Src);
-   if SrcLen<DestSize then
-     begin
-       Ansi2WideMoveProc(PChar(Src),Dest,SrcLen);
-       { there is room left, so terminate what is returned as a PWideChar }
-       if Dest<>nil then
-         Dest[SrcLen]:=#0;
-     end
-   else
-     Ansi2WideMoveProc(PChar(Src),Dest,DestSize);
-   result:=Dest;
- end;
- function WideCharLenToString(S : PWideChar;Len : SizeInt) : AnsiString;
- { Converts Len wide characters starting at S to an AnsiString.
-   Goes through Wide2AnsiMoveProc so that a routine installed with
-   SetWideStringManager is honoured, like the other conversions in this file. }
- begin
-   SetLength(result,Len);
-   if Len>0 then
-     Wide2AnsiMoveProc(S,PChar(result),Len);
- end;
- procedure WideCharLenToStrVar(Src : PWideChar;Len : SizeInt;var Dest : AnsiString); { procedure form of WideCharLenToString }
- begin
- Dest:=WideCharLenToString(Src,Len);
- end;
- procedure WideCharToStrVar(S : PWideChar;var Dest : AnsiString); { procedure form of WideCharToString }
- begin
- Dest:=WideCharToString(S);
- end;
- {$ifndef INTERNLENGTH}
- Function Length (Const S : WideString) : SizeInt;
- {
-   Returns the length of a WideString as stored in its header.
-   An empty string is a nil pointer and has length 0.
- }
- begin
-   Length:=0;
-   If Pointer(S)<>Nil then
-     Length:=PWideRec(Pointer(S)-WideFirstOff)^.Len;
- end;
- {$endif INTERNLENGTH}
- { overloaded version of UniqueString for interface; bound to the routine exported as FPC_WIDESTR_UNIQUE (fpc_widestr_Unique below) }
- procedure UniqueString(Var S : WideString); [external name 'FPC_WIDESTR_UNIQUE'];
- Function fpc_widestr_Unique(Var S : Pointer): Pointer; [Public,Alias : 'FPC_WIDESTR_UNIQUE']; {$ifdef hascompilerproc} compilerproc; {$endif}
- {
-   Makes sure S has a reference count of 1. When the count differs from 1
-   the data (including the terminating #0) is copied into a new block, the
-   old reference is dropped and S is redirected. Returns the resulting
-   data pointer; nil stays nil.
- }
- Var
-   Fresh : Pointer;
-   CharCount : SizeInt;
- begin
-   pointer(result) := pointer(s);
-   If Pointer(S)<>Nil then
-     if PWideRec(Pointer(S)-WideFirstOff)^.Ref<>1 then
-       begin
-         CharCount:=PWideRec(Pointer(S)-WideFirstOff)^.len;
-         Fresh:=NewWideString (CharCount);
-         { CharCount+1: take the terminating #0 along }
-         Move (PWideChar(S)^,Fresh^,(CharCount+1)*sizeof(WideChar));
-         PWideRec(Fresh-WideFirstOff)^.len:=CharCount;
-         fpc_widestr_decr_ref (Pointer(S)); { Thread safe }
-         pointer(S):=Fresh;
-         pointer(result):=Fresh;
-       end;
- end;
- {$ifdef interncopy}
- Function Fpc_WideStr_Copy (Const S : WideString; Index,Size : SizeInt) : WideString;compilerproc;
- {$else}
- Function Copy (Const S : WideString; Index,Size : SizeInt) : WideString;
- {$endif}
- { Returns up to Size characters of S starting at the 1-based Index.
-   An Index below 1 is treated as 1; Size is cut back to what S holds.
-   The result is empty (nil) when nothing remains to copy. }
- var
-   Fresh : Pointer;
-   SrcLen : SizeInt;
- begin
-   Fresh:=Nil;
-   SrcLen:=Length(S);
-   { switch to a 0-based start, never negative }
-   dec(index);
-   if Index < 0 then
-     Index := 0;
-   { Check Size. Accounts for Zero-length S, the double check is needed because
-     Size can be maxint and will get <0 when adding index }
-   if (Size>SrcLen) or
-      (Index+Size>SrcLen) then
-     Size:=SrcLen-Index;
-   If Size>0 then
-     begin
-       Fresh:=Pointer(NewWideString (Size));
-       if Fresh<>Nil then
-         begin
-           Move (PWideChar(S)[Index],Fresh^,Size*sizeof(WideChar));
-           PWideRec(Fresh-WideFirstOff)^.Len:=Size;
-           PWideChar(Fresh+Size*sizeof(WideChar))^:=#0;
-         end;
-     end;
- {$ifdef interncopy}
-   Pointer(fpc_widestr_Copy):=Fresh;
- {$else}
-   Pointer(Copy):=Fresh;
- {$endif}
- end;
- Function Pos (Const Substr : WideString; Const Source : WideString) : SizeInt;
- { Returns the 1-based position of the first occurrence of Substr in Source,
-   or 0 when Substr is empty or does not occur. }
- var
-   i,SubLen : SizeInt;
-   pc : pwidechar;
- begin
-   Pos:=0;
-   SubLen:=Length(SubStr);
-   if SubLen>0 then
-     begin
-       pc:=@source[1];
-       { the last start position that still leaves room for Substr }
-       for i:=1 to Length(source)-SubLen+1 do
-         begin
-           { cheap first-character test before the full comparison }
-           if (SubStr[1]=pc^) and
-              (CompareWord(Substr[1],pc^,SubLen)=0) then
-             begin
-               Pos:=i;
-               exit;
-             end;
-           inc(pc);
-         end;
-     end;
- end;
- { Faster version for a widechar alone }
- Function Pos (c : WideChar; Const s : WideString) : SizeInt;
- { Returns the 1-based position of the first c in s, or 0 when absent. }
- var
-   i,Count : SizeInt;
-   pc : pwidechar;
- begin
-   pos:=0;
-   pc:=@s[1];
-   Count:=length(s);
-   i:=1;
-   while i<=Count do
-     begin
-       if pc^=c then
-         begin
-           pos:=i;
-           exit;
-         end;
-       inc(pc);
-       inc(i);
-     end;
- end;
- { Faster version for a char alone. Must be implemented because }
- { pos(c: char; const s: shortstring) also exists, so otherwise }
- { using pos(char,pchar) will always call the shortstring version }
- { (exact match for first argument), also with $h+ (JM) }
- Function Pos (c : Char; Const s : WideString) : SizeInt;
- { Returns the 1-based position of the first occurrence of c (widened to a
-   WideChar) in s, or 0 when absent. }
- var
-   i,Count : SizeInt;
-   wc : widechar;
-   pc : pwidechar;
- begin
-   pos:=0;
-   wc:=c;
-   pc:=@s[1];
-   Count:=length(s);
-   i:=1;
-   while i<=Count do
-     begin
-       if pc^=wc then
-         begin
-           pos:=i;
-           exit;
-         end;
-       inc(pc);
-       inc(i);
-     end;
- end;
- Procedure Delete (Var S : WideString; Index,Size: SizeInt);
- { Removes up to Size characters from S, starting at the 1-based Index.
-   Nothing happens when S is empty, Index is outside 1..Length(S) or
-   Size<=0. A Size reaching past the end is cut back to the end of S. }
- Var
-   LS : SizeInt;
- begin
-   LS:=Length(S);
-   if (LS=0) or (Index<=0) or (Index>LS) or (Size<=0) then
-     exit;
-   UniqueString (S);
-   { clamp without forming Size+Index, which overflows for a huge Size }
-   if Size>LS-Index+1 then
-     Size:=LS-Index+1;
-   if Size<=LS-Index then
-     begin
-       Dec(Index);
-       { move only the tail behind the deleted range, plus the terminating
-         #0; a count of LS-Index+1 would read Size characters past the buffer }
-       Move(PWideChar(S)[Index+Size],PWideChar(S)[Index],(LS-Index-Size+1)*sizeof(WideChar));
-     end;
-   Setlength(s,LS-Size);
- end;
- Procedure Insert (Const Source : WideString; Var S : WideString; Index : SizeInt);
- { Inserts Source into S before the 1-based position Index. Index is
-   clamped to 1..Length(S)+1. Does nothing when Source is empty. }
- var
-   Temp : WideString;
-   LS,SrcLen : SizeInt;
- begin
-   SrcLen:=Length(Source);
-   If SrcLen=0 then
-     exit;
-   Ls:=Length(S);
-   if index <= 0 then
-     index := 1;
-   if index > LS then
-     index := LS+1;
-   { from here on Index is the 0-based insertion offset }
-   Dec(Index);
-   Pointer(Temp) := NewWideString(SrcLen+LS);
-   SetLength(Temp,SrcLen+LS);
-   { head of S }
-   If Index>0 then
-     move (PWideChar(S)^,PWideChar(Temp)^,Index*sizeof(WideChar));
-   { inserted text }
-   Move (PWideChar(Source)^,PWideChar(Temp)[Index],SrcLen*sizeof(WideChar));
-   { tail of S }
-   If LS>Index then
-     Move(PWideChar(S)[Index],PWideChar(temp)[SrcLen+index],(LS-Index)*sizeof(WideChar));
-   S:=Temp;
- end;
- Procedure SetString (Var S : WideString; Buf : PWideChar; Len : SizeInt);
- { Sets S to length Len, then copies characters from Buf into it. When a #0
-   is found at a position between 1 and Len-1, only the characters before
-   it are copied and a #0 is written behind them. With a nil Buf or
-   Len<=0 only the length is set. }
- var
-   ZeroAt: SizeInt;
- begin
-   SetLength(S,Len);
-   If (Buf=Nil) or (Len<=0) then
-     exit;
-   ZeroAt := IndexWord(Buf^, Len+1, 0);
-   If (ZeroAt>0) and (ZeroAt < Len) then
-     Len := ZeroAt;
-   Move (Buf[0],S[1],Len*sizeof(WideChar));
-   PWideChar(Pointer(S)+Len*sizeof(WideChar))^:=#0;
- end;
- Procedure SetString (Var S : WideString; Buf : PChar; Len : SizeInt);
- { Sets S to length Len, then converts characters from Buf into it through
-   the installed ansi->wide routine. When a #0 is found at a position
-   between 1 and Len-1, only the characters before it are converted and a
-   #0 is written behind them. With a nil Buf or Len<=0 only the length is
-   set. }
- var
-   ZeroAt: SizeInt;
- begin
-   SetLength(S,Len);
-   If (Buf=Nil) or (Len<=0) then
-     exit;
-   ZeroAt := IndexByte(Buf^, Len+1, 0);
-   If (ZeroAt>0) and (ZeroAt < Len) then
-     Len := ZeroAt;
-   Ansi2WideMoveProc(Buf,PWideChar(S),Len);
-   PWideChar(Pointer(S)+Len*sizeof(WideChar))^:=#0;
- end;
- Function fpc_Val_Real_WideStr(Const S : WideString; Var Code : ValSInt): ValReal; [public, alias:'FPC_VAL_REAL_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Val for a real value from a WideString: S is converted to a short
-   local string and handed to Val. Inputs longer than 255 characters are
-   rejected with Code=256 and a result of 0. }
- Var
-   SS : String;
- begin
-   fpc_Val_Real_WideStr := 0;
-   if length(S) <= 255 then
-     begin
-       SS := S;
-       Val(SS,fpc_Val_Real_WideStr,code);
-     end
-   else
-     code := 256;
- end;
- Function fpc_Val_UInt_WideStr (Const S : WideString; Var Code : ValSInt): ValUInt; [public, alias:'FPC_VAL_UINT_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Val for an unsigned integer from a WideString: S is converted to a
-   ShortString and handed to Val. Inputs longer than 255 characters are
-   rejected with Code=256 and a result of 0. }
- Var
-   SS : ShortString;
- begin
-   fpc_Val_UInt_WideStr := 0;
-   if length(S) <= 255 then
-     begin
-       SS := S;
-       Val(SS,fpc_Val_UInt_WideStr,code);
-     end
-   else
-     code := 256;
- end;
- Function fpc_Val_SInt_WideStr (DestSize: SizeInt; Const S : WideString; Var Code : ValSInt): ValSInt; [public, alias:'FPC_VAL_SINT_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Val for a signed integer from a WideString: S is converted to a
-   ShortString and passed on to fpc_Val_SInt_ShortStr together with
-   DestSize. Inputs longer than 255 characters are rejected with Code=256
-   and a result of 0. }
- Var
-   SS : ShortString;
- begin
-   fpc_Val_SInt_WideStr:=0;
-   if length(S)<=255 then
-     begin
-       SS := S;
-       fpc_Val_SInt_WideStr := fpc_Val_SInt_ShortStr(DestSize,SS,Code);
-     end
-   else
-     code:=256;
- end;
- {$ifndef CPU64}
- Function fpc_Val_qword_WideStr (Const S : WideString; Var Code : ValSInt): qword; [public, alias:'FPC_VAL_QWORD_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Val for a qword from a WideString: S is converted to a ShortString and
-   handed to Val. Inputs longer than 255 characters are rejected with
-   Code=256 and a result of 0. }
- Var
-   SS : ShortString;
- begin
-   fpc_Val_qword_WideStr:=0;
-   if length(S)<=255 then
-     begin
-       SS := S;
-       Val(SS,fpc_Val_qword_WideStr,Code);
-     end
-   else
-     code:=256;
- end;
- Function fpc_Val_int64_WideStr (Const S : WideString; Var Code : ValSInt): Int64; [public, alias:'FPC_VAL_INT64_WIDESTR']; {$ifdef hascompilerproc} compilerproc; {$endif}
- { Val for an Int64 from a WideString: S is converted to a ShortString and
-   handed to Val. Inputs longer than 255 characters are rejected with
-   Code=256 and a result of 0. }
- Var
-   SS : ShortString;
- begin
-   fpc_Val_int64_WideStr:=0;
-   if length(S)<=255 then
-     begin
-       SS := S;
-       Val(SS,fpc_Val_int64_WideStr,Code);
-     end
-   else
-     code:=256;
- end;
- {$endif CPU64}
- procedure fpc_WideStr_Float(d : ValReal;len,fr,rt : SizeInt;var s : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- var
- ss : shortstring; { intermediate result of the shortstring formatter }
- begin
- str_real(len,fr,d,treal_type(rt),ss); { rt is cast to treal_type before the call }
- s:=ss; { shortstring -> widestring conversion }
- end;
- {$ifdef STR_USES_VALINT}
- Procedure fpc_WideStr_SInt(v : ValSint; Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- {$else}
- Procedure fpc_WideStr_Longint(v : Longint; Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- {$endif}
- Var
- SS : ShortString; { intermediate result of Str }
- begin
- Str (v:Len,SS); { format the signed value v with field width Len }
- S:=SS; { shortstring -> widestring conversion }
- end;
- {$ifdef STR_USES_VALINT}
- Procedure fpc_WideStr_UInt(v : ValUInt;Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- {$else}
- Procedure fpc_WideStr_Longword(v : Longword;Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- {$endif}
- Var
- SS : ShortString; { intermediate result of Str }
- begin
- str(v:Len,SS); { format the unsigned value v with field width Len }
- S:=SS; { shortstring -> widestring conversion }
- end;
- {$ifndef CPU64}
- Procedure fpc_WideStr_Int64(v : Int64; Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- Var
- SS : ShortString; { intermediate result of Str }
- begin
- Str (v:Len,SS); { format the Int64 value v with field width Len }
- S:=SS; { shortstring -> widestring conversion }
- end;
- Procedure fpc_WideStr_Qword(v : Qword;Len : SizeInt; Var S : WideString);{$ifdef hascompilerproc} compilerproc; {$endif}
- Var
- SS : ShortString; { intermediate result of Str }
- begin
- str(v:Len,SS); { format the Qword value v with field width Len }
- S:=SS; { shortstring -> widestring conversion }
- end;
- {$endif CPU64}
- function UnicodeToUtf8(Dest: PChar; Source: PWideChar; MaxBytes: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
- { Convenience form for a #0-terminated Source: measures it with IndexWord
-   and forwards to the four-argument UnicodeToUtf8. Returns 0 for a nil
-   Source. }
- begin
-   Result:=0;
-   if assigned(Source) then
-     Result:=UnicodeToUtf8(Dest,MaxBytes,Source,IndexWord(Source^,-1,0));
- end;
- function UnicodeToUtf8(Dest: PChar; MaxDestBytes: SizeUInt; Source: PWideChar; SourceChars: SizeUInt): SizeUInt;
- { Encodes SourceChars 16-bit code units from Source as UTF-8.
-   With a non-nil Dest, at most MaxDestBytes bytes are written, including a
-   terminating #0, and encoding stops before a sequence that would not fit.
-   With a nil Dest nothing is written and only the required size is counted.
-   Returns the number of bytes produced/required plus one for the
-   terminator, or 0 when Source is nil.
-   Every code unit is encoded on its own as 1..3 bytes; surrogate pairs are
-   not combined. }
- var
-   i,j : SizeUInt;
-   w : word;
- begin
-   result:=0;
-   if source=nil then
-     exit;
-   i:=0;
-   j:=0;
-   if assigned(Dest) then
-     begin
-       while (i<SourceChars) and (j<MaxDestBytes) do
-         begin
-           w:=word(Source[i]);
-           case w of
-             0..$7f:
-               begin
-                 Dest[j]:=char(w);
-                 inc(j);
-               end;
-             $80..$7ff:
-               begin
-                 { keep one byte free for the terminator }
-                 if j+1>=MaxDestBytes then
-                   break;
-                 Dest[j]:=char($c0 or (w shr 6));
-                 Dest[j+1]:=char($80 or (w and $3f));
-                 inc(j,2);
-               end;
-             else
-               begin
-                 { keep one byte free for the terminator }
-                 if j+2>=MaxDestBytes then
-                   break;
-                 Dest[j]:=char($e0 or (w shr 12));
-                 Dest[j+1]:=char($80 or ((w shr 6)and $3f));
-                 Dest[j+2]:=char($80 or (w and $3f));
-                 inc(j,3);
-               end;
-           end;
-           inc(i);
-         end;
-       { a zero-sized buffer has no room for the terminator; also avoids the
-         unsigned wrap-around of MaxDestBytes-1 }
-       if MaxDestBytes>0 then
-         begin
-           if j>MaxDestBytes-1 then
-             j:=MaxDestBytes-1;
-           Dest[j]:=#0;
-         end;
-     end
-   else
-     begin
-       while i<SourceChars do
-         begin
-           case word(Source[i]) of
-             $0..$7f:
-               inc(j);
-             $80..$7ff:
-               inc(j,2);
-             else
-               inc(j,3);
-           end;
-           { advance to the next code unit; without this the loop never ends }
-           inc(i);
-         end;
-     end;
-   result:=j+1;
- end;
- function Utf8ToUnicode(Dest: PWideChar; Source: PChar; MaxChars: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
- { Convenience form for a #0-terminated Source: measures it with strlen and
-   forwards to the four-argument Utf8ToUnicode. Returns 0 for a nil Source. }
- begin
-   Result:=0;
-   if assigned(Source) then
-     Result:=Utf8ToUnicode(Dest,MaxChars,Source,strlen(Source));
- end;
- function Utf8ToUnicode(Dest: PWideChar; MaxDestChars: SizeUInt; Source: PChar; SourceBytes: SizeUInt): SizeUInt;
- { Decodes SourceBytes bytes of UTF-8 from Source into 16-bit code units.
-   With a non-nil Dest, at most MaxDestChars code units are stored; no
-   terminating #0 is written. With a nil Dest the code units are only
-   counted.
-   Returns the number of code units plus one, or 0 when a sequence is
-   truncated or a continuation byte is malformed.
-   Only 1..3 byte sequences are understood; any lead byte with bit $20 set
-   is treated as a three-byte lead. }
- var
-   i,j : SizeUInt;
-   w : word;
-   b : byte;
- begin
-   result:=0;
-   i:=0;
-   j:=0;
-   if assigned(Dest) then
-     begin
-       while (j<MaxDestChars) and (i<SourceBytes) do
-         begin
-           b:=byte(Source[i]);
-           inc(i);
-           // 2 or 3 bytes?
-           if b>=$80 then
-             begin
-               if i>=SourceBytes then
-                 exit;
-               // 3 bytes?
-               if (b and $20)<>0 then
-                 begin
-                   { lead byte 1110xxxx carries 4 payload bits }
-                   w:=b and $0f;
-                   b:=byte(Source[i]);
-                   inc(i);
-                   if i>=SourceBytes then
-                     exit;
-                   if (b and $c0)<>$80 then
-                     exit;
-                   { continuation byte 10xxxxxx carries 6 payload bits }
-                   w:=(w shl 6) or (b and $3f);
-                 end
-               else
-                 { lead byte 110xxxxx carries 5 payload bits }
-                 w:=b and $1f;
-               b:=byte(Source[i]);
-               if (b and $c0)<>$80 then
-                 exit;
-               w:=(w shl 6) or (b and $3f);
-               inc(i);
-             end
-           else
-             { plain ASCII: the byte is the code unit }
-             w:=b;
-           Dest[j]:=WideChar(w);
-           inc(j);
-         end;
-     end
-   else
-     begin
-       while i<SourceBytes do
-         begin
-           b:=byte(Source[i]);
-           inc(i);
-           // 2 or 3 bytes?
-           if b>=$80 then
-             begin
-               if i>=SourceBytes then
-                 exit;
-               // 3 bytes?
-               if (b and $20)<>0 then
-                 begin
-                   b:=byte(Source[i]);
-                   inc(i);
-                   if i>=SourceBytes then
-                     exit;
-                   if (b and $c0)<>$80 then
-                     exit;
-                 end;
-               if (byte(Source[i]) and $c0)<>$80 then
-                 exit;
-               inc(i);
-             end;
-           inc(j);
-         end;
-     end;
-   result:=j+1;
- end;
{ Returns the UTF-8 encoding of the wide string s.

  An empty s gives an empty result. Otherwise a scratch string of three
  bytes per source character is filled by UnicodeToUtf8 and then cut back
  to the reported size (the count returned includes the terminator, hence
  the -1). If UnicodeToUtf8 reports 0 the result stays empty. }
function UTF8Encode(const s : WideString) : UTF8String;
  var
    written : SizeInt;
    buf : UTF8String;
  begin
    result:='';
    if length(s)=0 then
      exit;
    { largest expansion produced by UnicodeToUtf8: three bytes per character }
    SetLength(buf,3*length(s));
    written:=UnicodeToUtf8(pchar(buf),length(buf)+1,PWideChar(s),length(s));
    if written<=0 then
      exit;
    SetLength(buf,written-1);
    result:=buf;
  end;
{ Returns the wide string decoded from the UTF-8 string s.

  An empty s gives an empty result. Otherwise a scratch wide string of
  one character per source byte is filled by Utf8ToUnicode and then cut
  back to the reported size (the count returned is one more than the
  number of characters, hence the -1). If Utf8ToUnicode reports 0 the
  result stays empty. }
function UTF8Decode(const s : UTF8String): WideString;
  var
    decoded : SizeInt;
    buf : WideString;
  begin
    result:='';
    if length(s)=0 then
      exit;
    { decoding never yields more characters than there are input bytes }
    SetLength(buf,length(s));
    decoded:=Utf8ToUnicode(PWideChar(buf),length(buf)+1,pchar(s),length(s));
    if decoded<=0 then
      exit;
    SetLength(buf,decoded-1);
    result:=buf;
  end;
{ Returns s encoded as UTF-8 by handing it to Utf8Encode.
  Utf8Encode takes a WideString, so the ansistring argument is converted
  by the compiler as part of the call. }
function AnsiToUtf8(const s : ansistring): UTF8String;{$ifdef SYSTEMINLINE}inline;{$endif}
  begin
    AnsiToUtf8:=Utf8Encode(s);
  end;
{ Returns the UTF-8 string s as an ansistring by handing it to Utf8Decode.
  Utf8Decode yields a WideString, which the compiler converts to the
  ansistring result on assignment. }
function Utf8ToAnsi(const s : UTF8String) : ansistring;{$ifdef SYSTEMINLINE}inline;{$endif}
  begin
    Utf8ToAnsi:=Utf8Decode(s);
  end;
- {
- $Log$
- Revision 1.44 2004-09-29 14:55:49 mazen
- * widestring conversion routines take a widechar so no
- information is lost
- Revision 1.43 2004/09/18 10:23:08 jonas
- - removed unused local variable
- * fixed bug in Utf8ToUnicode (use of uninitialised variable)
- Revision 1.42 2004/07/18 20:21:44 florian
- + several unicode (to/from utf-8 conversion) stuff added
- * some longint -> SizeInt changes
- Revision 1.41 2004/07/12 17:58:19 peter
- * remove maxlen field from ansistring/widestrings
- Revision 1.40 2004/07/02 21:21:09 peter
- * decr ref doesn't reset pointer
- * finalize resets pointer for astring,wstring
- Revision 1.39 2004/05/31 14:31:57 peter
- * remove comment warnings
- Revision 1.38 2004/05/29 15:39:08 florian
- * the decr functions set the data now to nil
- Revision 1.37 2004/05/01 23:55:18 peter
- * replace strlenint with sizeint
- Revision 1.36 2004/04/29 18:59:43 peter
- * str() helpers now also use valint/valuint
- * int64/qword helpers disabled for cpu64
- Revision 1.35 2004/01/22 22:09:05 peter
- * finalize needs to reset to nil after decr_ref
- Revision 1.34 2003/11/29 17:27:05 michael
- + Added overloaded version of SetWideStringManager without old parameter
- Revision 1.33 2003/11/28 20:36:13 michael
- + Added WideStringManager
- Revision 1.32 2003/11/05 15:33:51 florian
- * made Index* usage consistent with astrings.inc
- Revision 1.31 2003/06/17 19:24:08 jonas
- * fixed conversion of fpc_*str_unique to compilerproc
- Revision 1.30 2003/06/17 16:38:53 jonas
- * fpc_ansistr|widestr_unique is now a function so it can be used as
- compilerproc
- Revision 1.29 2003/05/01 08:05:23 florian
- * started to make the rtl 64 bit safe by introducing SizeInt and SizeUInt (similar to size_t of C)
- Revision 1.28 2002/12/29 16:59:17 peter
- * implemented some more conversions
- Revision 1.27 2002/12/15 22:33:12 peter
- * SetString(WideString,[PChar|PWideChar],Len) added
- Revision 1.26 2002/12/14 19:16:45 sg
- * Ported improvements from the AnsiString equivalents to NewWideString and
- fpc_WideStr_SetLength
- Revision 1.25 2002/12/07 14:35:34 carl
- - avoid warnings (add typecast)
- Revision 1.24 2002/10/10 16:08:50 florian
- + several widestring/pwidechar related helpers added
- Revision 1.23 2002/10/02 18:21:52 peter
- * Copy() changed to internal function calling compilerprocs
- * FPC_SHORTSTR_COPY renamed to FPC_SHORTSTR_ASSIGN because of the
- new copy functions
- Revision 1.22 2002/09/26 21:50:38 florian
- + some WideString<->AnsiString conversion functions added
- Revision 1.21 2002/09/14 11:20:50 carl
- * Delphi compatibility fix (with string routines)
- Revision 1.20 2002/09/07 21:16:45 carl
- * cardinal -> longword
- Revision 1.19 2002/09/07 15:07:46 peter
- * old logs removed and tabs fixed
- Revision 1.18 2002/07/29 21:28:17 florian
- * several fixes to get further with linux/ppc system unit compilation
- Revision 1.17 2002/04/26 15:19:05 peter
- * use saveregisters for incr routines, saves also problems with
- the optimizer
- Revision 1.16 2002/04/25 20:14:57 peter
- * updated compilerprocs
- * incr ref count has now a value argument instead of var
- }
|