1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735173617371738173917401741174217431744174517461747174817491750175117521753175417551756175717581759176017611762176317641765176617671768176917701771177217731774177517761777177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116211721182119212021212122212321242125212621272128212921302131213221332134213521362137213821392140214121422143214421452146214721482149215021512152215321542155215621572158215921602161216221632164216521662167216821692170217121722173217421752176217721782179218021812182218321842185218621872188218921902191219221932194219521962197219821992200220122022203220422052206220722082209221022112212221322142215221622172218221922202221222222232224222522262227222822292230223122322233223422352236223722382239224022412242224322442245224622472248224922502251225222532254225522562257225822592260226122622263226422652266226722682269227022712272227322742275227622772278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470 |
- {
- This file is part of the Free Pascal run time library.
- Copyright (c) 1999-2005 by Florian Klaempfl,
- member of the Free Pascal development team.
- This file implements support routines for UTF-8 strings with FPC
- See the file COPYING.FPC, included in this distribution,
- for details about the copyright.
- This program is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- **********************************************************************}
- {$ifndef FPC_UNICODESTRING_TYPE_DEFINED}
- {$define FPC_UNICODESTRING_TYPE_DEFINED}
- {
- This file contains the implementation of the UnicodeString type,
- and all things that are needed for it.
- UnicodeString is defined as a 'silent' punicodechar :
- a punicodechar that points to (S= SizeOf(SizeInt), R= (if CPU64 then SizeOf(Longint) else SizeOf(SizeInt))):
- @-S-R : Reference count (R bytes)
- @-S : SizeInt for size; size=number of chars. Multiply with
- sizeof(UnicodeChar) to get the number of bytes. This is compatible with Delphi.
- @ : String + Terminating #0;
- Punicodechar(Unicodestring) is a valid typecast.
- So WS[i] is converted to the address @WS+i-1.
- Constants should be assigned a reference count of -1
- Meaning that they can't be disposed of.
- }
- Type
- PUnicodeRec = ^TUnicodeRec;
- TUnicodeRec = Record
- CodePage : TSystemCodePage;
- ElementSize : Word;
- {$if not defined(VER3_0) and not defined(VER3_2)}
- {$ifdef CPU64}
- Ref : Longint;
- {$else}
- Ref : SizeInt;
- {$endif}
- {$else}
- {$ifdef CPU64}
- { align fields }
- Dummy : DWord;
- {$endif CPU64}
- Ref : SizeInt;
- {$endif}
- Len : SizeInt;
- end;
- Const
- UnicodeFirstOff = SizeOf(TUnicodeRec);
- {$endif FPC_UNICODESTRING_TYPE_DEFINED}
- {
- Default UnicodeChar <-> AnsiChar conversion is to only convert the
- lower 127 chars, all others are translated to '?'.
- These routines can be overridden for the Current Locale
- }
- {$ifndef FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
- {$define FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
- procedure DefaultUnicode2AnsiMove(source:punicodechar;var dest:RawByteString;cp : TSystemCodePage;len:SizeInt);
- var
- i : SizeInt;
- p : PAnsiChar;
- begin
- setlength(dest,len);
- if not assigned(pointer(dest)) then
- exit;
- SetCodePage(dest,cp,false);
- p:=pointer(dest); {SetLength guarantees that dest is unique}
- for i:=1 to len do
- begin
- if word(source^)<256 then
- p^:=AnsiChar(word(source^))
- else
- p^:='?';
- inc(source);
- inc(p);
- end;
- end;
- {$endif FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
- {$ifndef FPC_HAS_DEFAULT_ANSI_2_UNICODE}
- {$define FPC_HAS_DEFAULT_ANSI_2_UNICODE}
- procedure DefaultAnsi2UnicodeMove(source:pansichar;cp : TSystemCodePage;var dest:unicodestring;len:SizeInt);
- var
- i : SizeInt;
- p : PUnicodeChar;
- begin
- setlength(dest,len);
- p:=pointer(dest); {SetLength guarantees that dest is unique}
- for i:=1 to len do
- begin
- p^:=unicodechar(byte(source^));
- inc(source);
- inc(p);
- end;
- end;
- {$endif FPC_HAS_DEFAULT_ANSI_2_UNICODE}
- {$ifndef FPC_HAS_BUILTIN_WIDESTR_MANAGER}
- function DefaultCharLengthPChar(const Str: PAnsiChar): PtrInt;
- begin
- DefaultCharLengthPChar:=length(Str);
- end;
- function DefaultCodePointLength(const Str: PAnsiChar; MaxLookAead: PtrInt): Ptrint;
- begin
- if str[0]<>#0 then
- DefaultCodePointLength:=1
- else
- DefaultCodePointLength:=0;
- end;
- {$endif FPC_HAS_BUILTIN_WIDESTR_MANAGER}
- function DefaultGetStandardCodePage(const stdcp: TStandardCodePageEnum): TSystemCodePage;
- begin
- { don't raise an exception here. We need this for text file handling }
- if stdcp<>scpFileSystemSingleByte then
- Result:=DefaultSystemCodePage
- else
- { we could return UTF-8 here in case of FPCRTL_FILESYSTEM_UTF8, but
- without a fully functional widestring manager that will probably cause
- more problems that it solves }
- Result:=DefaultFileSystemCodePage
- end;
- Procedure GetUnicodeStringManager (Out Manager : TUnicodeStringManager);
- begin
- manager:=widestringmanager;
- end;
- Procedure SetUnicodeStringManager (Const New : TUnicodeStringManager; Out Old: TUnicodeStringManager);
- begin
- Old:=widestringmanager;
- widestringmanager:=New;
- end;
- Procedure SetUnicodeStringManager (Const New : TUnicodeStringManager);
- begin
- widestringmanager:=New;
- end;
- Procedure GetWideStringManager (out Manager : TUnicodeStringManager);
- begin
- manager:=widestringmanager;
- end;
- Procedure SetWideStringManager (Const New : TUnicodeStringManager; Out old: TUnicodeStringManager);
- begin
- Old:=widestringmanager;
- widestringmanager:=New;
- end;
- Procedure SetWideStringManager (Const New : TUnicodeStringManager);
- begin
- widestringmanager:=New;
- end;
- {****************************************************************************
- Internal functions, not in interface.
- ****************************************************************************}
- procedure UnicodeStringError;
- begin
- HandleErrorAddrFrameInd(204,get_pc_addr,get_frame);
- end;
- {$ifndef FPC_HAS_NEW_UNICODESTRING}
- {$define FPC_HAS_NEW_UNICODESTRING}
- Function NewUnicodeString(Len : SizeInt) : Pointer;
- {
- Allocate a new UnicodeString on the heap.
- initialize it to zero length and reference count 1.
- }
- begin
- Result:=GetMem(Len*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar)));
- If Result=Nil then
- UnicodeStringError;
- PUnicodeRec(Result)^.Len:=Len; { Initial length }
- PUnicodeRec(Result)^.Ref:=1; { Initial Refcount }
- PUnicodeRec(Result)^.CodePage:=DefaultUnicodeCodePage;
- PUnicodeRec(Result)^.ElementSize:=SizeOf(UnicodeChar);
- inc(Result,UnicodeFirstOff); { Points to string now }
- PUnicodeChar(Result)^:=#0; { Terminating #0 }
- end;
- {$endif FPC_HAS_NEW_UNICODESTRING}
- {$ifndef FPC_HAS_UNICODESTR_DECR_REF}
- {$define FPC_HAS_UNICODESTR_DECR_REF}
- Procedure fpc_UnicodeStr_Decr_Ref (Var S : Pointer);[Public,Alias:'FPC_UNICODESTR_DECR_REF']; compilerproc;
- {
- Decreases the ReferenceCount of a non constant unicodestring;
- If the reference count is zero, deallocate the string;
- }
- Var
- p: PUnicodeRec;
- Begin
- { Zero string }
- if S=Nil then
- exit;
- { check for constant strings ...}
- p:=PUnicodeRec(S-UnicodeFirstOff);
- S:=nil;
- if p^.Ref<0 then
- exit;
- { declocked does a MT safe dec and returns true, if the counter is 0 }
- if declocked(p^.Ref) then
- FreeMem(p);
- end;
- { alias for internal use }
- Procedure fpc_UnicodeStr_Decr_Ref (Var S : Pointer);[external name 'FPC_UNICODESTR_DECR_REF'];
- {$endif FPC_HAS_UNICODESTR_DECR_REF}
- {$ifndef FPC_HAS_UNICODESTR_INCR_REF}
- {$define FPC_HAS_UNICODESTR_INCR_REF}
- Procedure fpc_UnicodeStr_Incr_Ref(S : Pointer);[Public,Alias:'FPC_UNICODESTR_INCR_REF']; compilerproc;
- Begin
- If S=Nil then
- exit;
- { constant string ? }
- If PUnicodeRec(S-UnicodeFirstOff)^.Ref<0 then
- exit;
- inclocked(PUnicodeRec(S-UnicodeFirstOff)^.Ref);
- end;
- { alias for internal use }
- Procedure fpc_UnicodeStr_Incr_Ref (S : Pointer);[external name 'FPC_UNICODESTR_INCR_REF'];
- {$endif FPC_HAS_UNICODESTR_INCR_REF}
- {$ifndef FPC_HAS_UNICODESTR_TO_SHORTSTR}
- {$define FPC_HAS_UNICODESTR_TO_SHORTSTR}
- procedure fpc_UnicodeStr_To_ShortStr (out res: ShortString;const S2 : UnicodeString); [Public, alias: 'FPC_UNICODESTR_TO_SHORTSTR'];compilerproc;
- {
- Converts a UnicodeString to a ShortString;
- }
- Var
- Size : SizeInt;
- temp : ansistring;
- begin
- res:='';
- Size:=Length(S2);
- if Size>0 then
- begin
- If Size>high(res) then
- Size:=high(res);
- widestringmanager.Unicode2AnsiMoveProc(PUnicodeChar(S2),temp,DefaultSystemCodePage,Size);
- res:=temp;
- end;
- end;
- {$endif FPC_HAS_UNICODESTR_TO_SHORTSTR}
- {$ifndef FPC_HAS_SHORTSTR_TO_UNICODESTR}
- {$define FPC_HAS_SHORTSTR_TO_UNICODESTR}
- Function fpc_ShortStr_To_UnicodeStr (Const S2 : ShortString): UnicodeString;compilerproc;
- {
- Converts a ShortString to a UnicodeString;
- }
- Var
- Size : SizeInt;
- begin
- result:='';
- Size:=Length(S2);
- if Size>0 then
- widestringmanager.Ansi2UnicodeMoveProc(PAnsiChar(@S2[1]),DefaultSystemCodePage,result,Size);
- end;
- {$endif FPC_HAS_SHORTSTR_TO_UNICODESTR}
- {$ifndef FPC_HAS_UNICODESTR_TO_ANSISTR}
- {$define FPC_HAS_UNICODESTR_TO_ANSISTR}
- Function fpc_UnicodeStr_To_AnsiStr (const S2 : UnicodeString{$ifdef FPC_HAS_CPSTRING};cp : TSystemCodePage{$endif FPC_HAS_CPSTRING}): AnsiString; compilerproc;
- {
- Converts a UnicodeString to an AnsiString
- }
- Var
- Size : SizeInt;
- {$ifndef FPC_HAS_CPSTRING}
- cp : TSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- begin
- {$ifndef FPC_HAS_CPSTRING}
- cp:=DefaultSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- result:='';
- Size:=Length(S2);
- if Size>0 then
- begin
- cp:=TranslatePlaceholderCP(cp);
- widestringmanager.Unicode2AnsiMoveProc(PUnicodeChar(Pointer(S2)),result,cp,Size);
- end;
- end;
- {$endif FPC_HAS_UNICODESTR_TO_ANSISTR}
- {$ifndef FPC_HAS_ANSISTR_TO_UNICODESTR}
- {$define FPC_HAS_ANSISTR_TO_UNICODESTR}
- Function fpc_AnsiStr_To_UnicodeStr (Const S2 : RawByteString): UnicodeString; compilerproc;
- {
- Converts an AnsiString to a UnicodeString;
- }
- Var
- Size : SizeInt;
- cp: TSystemCodePage;
- begin
- result:='';
- Size:=Length(S2);
- if Size>0 then
- begin
- cp:=TranslatePlaceholderCP(StringCodePage(S2));
- widestringmanager.Ansi2UnicodeMoveProc(PAnsiChar(S2),cp,result,Size);
- end;
- end;
- {$endif FPC_HAS_ANSISTR_TO_UNICODESTR}
- {$ifndef FPC_HAS_UNICODESTR_TO_WIDESTR}
- {$define FPC_HAS_UNICODESTR_TO_WIDESTR}
- Function fpc_UnicodeStr_To_WideStr (const S2 : UnicodeString): WideString; compilerproc;
- begin
- SetLength(Result,Length(S2));
- Move(pointer(S2)^,Pointer(Result)^,Length(S2)*sizeof(WideChar));
- end;
- {$endif FPC_HAS_UNICODESTR_TO_WIDESTR}
- {$ifndef FPC_HAS_WIDESTR_TO_UNICODESTR}
- {$define FPC_HAS_WIDESTR_TO_UNICODESTR}
- Function fpc_WideStr_To_UnicodeStr (Const S2 : WideString): UnicodeString; compilerproc;
- begin
- SetLength(Result,Length(S2));
- Move(pointer(S2)^,Pointer(Result)^,Length(S2)*sizeof(WideChar));
- end;
- {$endif FPC_HAS_WIDESTR_TO_UNICODESTR}
- {$ifndef FPC_HAS_PWIDECHAR_TO_UNICODESTR}
- {$define FPC_HAS_PWIDECHAR_TO_UNICODESTR}
- Function fpc_PWideChar_To_UnicodeStr(const p : pwidechar): unicodestring; compilerproc;
- var
- Size : SizeInt;
- begin
- result:='';
- if p=nil then
- exit;
- Size := IndexWord(p^, -1, 0);
- Setlength(result,Size);
- if Size>0 then
- Move(p^,PUnicodeChar(Pointer(result))^,Size*sizeof(UnicodeChar));
- end;
- {$endif FPC_HAS_PWIDECHAR_TO_UNICODESTR}
- {$ifndef FPC_HAS_PWIDECHAR_TO_ANSISTR}
- {$define FPC_HAS_PWIDECHAR_TO_ANSISTR}
- Function fpc_PWideChar_To_AnsiStr(const p : pwidechar{$ifdef FPC_HAS_CPSTRING};cp : TSystemCodePage{$endif FPC_HAS_CPSTRING}): ansistring; compilerproc;
- var
- Size : SizeInt;
- {$ifndef FPC_HAS_CPSTRING}
- cp : TSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- begin
- {$ifndef FPC_HAS_CPSTRING}
- cp:=DefaultSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- result:='';
- if p=nil then
- exit;
- Size := IndexWord(p^, -1, 0);
- if Size>0 then
- begin
- cp:=TranslatePlaceholderCP(cp);
- widestringmanager.Wide2AnsiMoveProc(P,result,cp,Size);
- end;
- end;
- {$endif FPC_HAS_PWIDECHAR_TO_ANSISTR}
- {$ifndef FPC_HAS_PWIDECHAR_TO_SHORTSTR}
- {$define FPC_HAS_PWIDECHAR_TO_SHORTSTR}
- procedure fpc_PWideChar_To_ShortStr(out res : shortstring;const p : pwidechar); compilerproc;
- var
- Size : SizeInt;
- temp: ansistring;
- begin
- res:='';
- if p=nil then
- exit;
- Size:=IndexWord(p^, high(PtrInt), 0);
- if Size>0 then
- begin
- widestringmanager.Wide2AnsiMoveProc(p,temp,DefaultSystemCodePage,Size);
- res:=temp;
- end;
- end;
- {$endif FPC_HAS_PWIDECHAR_TO_SHORTSTR}
- {$ifndef FPC_HAS_UNICODESTR_ASSIGN}
- {$define FPC_UNICODESTR_ASSIGN}
- { checked against the ansistring routine, 2001-05-27 (FK) }
- Procedure fpc_UnicodeStr_Assign (Var S1 : Pointer;S2 : Pointer);[Public,Alias:'FPC_UNICODESTR_ASSIGN']; compilerproc;
- {
- Assigns S2 to S1 (S1:=S2), taking in account reference counts.
- }
- begin
- If S2<>nil then
- If PUnicodeRec(S2-UnicodeFirstOff)^.Ref>0 then
- inclocked(PUnicodeRec(S2-UnicodeFirstOff)^.ref);
- { Decrease the reference count on the old S1 }
- fpc_unicodestr_decr_ref (S1);
- s1:=s2;
- end;
- { alias for internal use }
- Procedure fpc_UnicodeStr_Assign (Var S1 : Pointer;S2 : Pointer);[external name 'FPC_UNICODESTR_ASSIGN'];
- {$endif FPC_UNICODESTR_ASSIGN}
- {$ifndef FPC_HAS_UNICODESTR_CONCAT}
- {$define FPC_HAS_UNICODESTR_CONCAT}
- procedure fpc_UnicodeStr_Concat (var DestS:Unicodestring;const S1,S2 : UnicodeString); compilerproc;
- Var
- S1Len,S2Len : SizeInt;
- OldDestP,NewDestP,RealDestP,Src : Pointer;
- begin
- { only assign if s1 or s2 is empty }
- if Length(S1)=0 then
- begin
- DestS:=s2;
- exit;
- end;
- if Length(S2)=0 then
- begin
- DestS:=s1;
- exit;
- end;
- S1Len:=PUnicodeRec(Pointer(S1)-UnicodeFirstOff)^.Len;
- S2Len:=PUnicodeRec(Pointer(S2)-UnicodeFirstOff)^.Len;
- OldDestP:=Pointer(DestS);
- { Reallocate when possible; in the hope this will reuse the chunk more often than do a redundant copy. }
- if Assigned(OldDestP) and (PUnicodeRec(OldDestP-UnicodeFirstOff)^.Ref=1) then
- begin
- RealDestP:=OldDestP-UnicodeFirstOff;
- NewDestP:=ReallocMem(RealDestP,UnicodeFirstOff+sizeof(UnicodeChar)+(S1Len+S2Len)*sizeof(UnicodeChar))+UnicodeFirstOff;
- { Copy S2 first, as in the case of OldDestP = Pointer(S2) it must be copied first and in other cases the order does not matter. }
- Src:=Pointer(S2);
- if Src=OldDestP then
- Src:=NewDestP;
- Move(Src^,PUnicodeChar(NewDestP)[S1Len],S2Len*sizeof(UnicodeChar));
- if OldDestP<>Pointer(S1) then { Not an append, need to copy S1? }
- Move(Pointer(S1)^,NewDestP^,S1Len*sizeof(UnicodeChar));
- end
- else
- begin
- NewDestP:=NewUnicodeString(S1Len+S2Len);
- Move(Pointer(S1)^,NewDestP^,S1Len*sizeof(UnicodeChar));
- Move(Pointer(S2)^,PUnicodeChar(NewDestP)[S1Len],S2Len*sizeof(UnicodeChar));
- fpc_unicodestr_decr_ref(Pointer(DestS));
- end;
- PUnicodeChar(NewDestP)[S1Len+S2Len]:=#0;
- PUnicodeRec(NewDestP-UnicodeFirstOff)^.Len:=S1Len+S2Len;
- Pointer(DestS):=NewDestP;
- end;
- {$endif FPC_HAS_UNICODESTR_CONCAT}
- {$ifndef FPC_HAS_UNICODESTR_CONCAT_MULTI}
- {$define FPC_HAS_UNICODESTR_CONCAT_MULTI}
- procedure fpc_UnicodeStr_Concat_multi (var DestS:Unicodestring;const sarr:array of Unicodestring); compilerproc;
- Var
- lowstart,i,Size,NewLen : SizeInt;
- p,pc,OldDestP,NewDestP,RealDestP : pointer;
- begin
- lowstart:=low(sarr);
- { skip empty strings }
- while (lowstart<=high(sarr)) and (sarr[lowstart]='') do
- inc(lowstart);
- if lowstart>high(sarr) then
- begin
- DestS:=''; { All source strings empty }
- exit;
- end;
- { Calculate size of the result so we can do
- a single call to SetLength() }
- NewLen:=0;
- for i:=lowstart to high(sarr) do
- inc(NewLen,length(sarr[i]));
- { In the case of the only nonempty string, return it directly. }
- if NewLen=PUnicodeRec(Pointer(sarr[lowstart])-UnicodeFirstOff)^.Len then
- begin
- DestS:=sarr[lowstart];
- exit;
- end;
- OldDestP:=Pointer(DestS);
- { Reallocate when possible; in the hope this will reuse the chunk more often than do a redundant copy. }
- if Assigned(OldDestP) and (PUnicodeRec(OldDestP-UnicodeFirstOff)^.Ref=1) then
- begin
- RealDestP:=OldDestP-UnicodeFirstOff;
- NewDestP:=ReallocMem(RealDestP,UnicodeFirstOff+sizeof(UnicodeChar)+NewLen*sizeof(UnicodeChar))+UnicodeFirstOff;
- { First string can be skipped if appending. }
- if OldDestP=Pointer(sarr[lowstart]) then
- inc(lowstart);
- end
- else
- begin
- { Create new string. }
- OldDestP:=nil; { This case is distinguished as "not assigned(olddestp)". Also prevents "if p=olddestp" in the loop below shared with the ReallocMem branch. }
- NewDestP:=NewUnicodeString(NewLen);
- end;
- { Copy strings from last to the first, so that possible occurences of DestS could read from the beginning of the reallocated DestS. }
- pc:=NewDestP+NewLen*sizeof(UnicodeChar);
- for i:=high(sarr) downto lowstart do
- begin
- p:=Pointer(sarr[i]);
- if not Assigned(p) then
- continue;
- if p=OldDestP then
- { DestS occured among pieces in the ReallocMem case! Use the new pointer. Its header still conveniently contains old DestS length. }
- p:=NewDestP;
- Size:=PUnicodeRec(p-UnicodeFirstOff)^.Len*sizeof(UnicodeChar);
- dec(pc,size);
- Move(p^,pc^,Size);
- end;
- if not assigned(OldDestP) then
- fpc_UnicodeStr_Decr_Ref(Pointer(DestS));
- PUnicodeChar(NewDestP)[NewLen]:=#0;
- PUnicodeRec(NewDestP-UnicodeFirstOff)^.Len:=NewLen; { Careful, loop above relies on the old Len in the NewDestP header. }
- Pointer(DestS):=NewDestP;
- end;
- {$endif FPC_HAS_UNICODESTR_CONCAT_MULTI}
- {$ifndef FPC_HAS_CHAR_TO_UCHAR}
- {$define FPC_HAS_CHAR_TO_UCHAR}
- Function fpc_Char_To_UChar(const c : AnsiChar): UnicodeChar; compilerproc;
- var
- w: unicodestring;
- begin
- widestringmanager.Ansi2UnicodeMoveProc(@c,DefaultSystemCodePage,w,1);
- fpc_Char_To_UChar:=w[1];
- end;
- {$endif FPC_HAS_CHAR_TO_UCHAR}
- {$ifndef FPC_HAS_CHAR_TO_UNICODESTR}
- {$define FPC_HAS_CHAR_TO_UNICODESTR}
- Function fpc_Char_To_UnicodeStr(const c : AnsiChar): UnicodeString; compilerproc;
- {
- Converts a AnsiChar to a UnicodeString;
- }
- begin
- widestringmanager.Ansi2UnicodeMoveProc(@c,DefaultSystemCodePage,result,1);
- end;
- {$endif FPC_HAS_CHAR_TO_UNICODESTR}
- {$ifndef FPC_HAS_UCHAR_TO_CHAR}
- {$define FPC_HAS_UCHAR_TO_CHAR}
- Function fpc_UChar_To_Char(const c : UnicodeChar): AnsiChar; compilerproc;
- {
- Converts a UnicodeChar to a AnsiChar;
- }
- var
- s: ansistring;
- begin
- widestringmanager.Unicode2AnsiMoveProc(@c, s, DefaultSystemCodePage, 1);
- if length(s)=1 then
- fpc_UChar_To_Char:= s[1]
- else
- fpc_UChar_To_Char:='?';
- end;
- {$endif FPC_HAS_UCHAR_TO_CHAR}
- {$ifndef FPC_HAS_UCHAR_TO_SHORTSTR}
- {$define FPC_HAS_UCHAR_TO_SHORTSTR}
- function fpc_UChar_To_ShortStr(const c : WideChar): shortstring; compilerproc;
- {
- Converts a WideChar to a ShortString;
- }
- var
- s: ansistring;
- begin
- widestringmanager.Wide2AnsiMoveProc(@c,s,DefaultSystemCodePage,1);
- result:=s;
- end;
- {$endif FPC_HAS_UCHAR_TO_SHORTSTR}
- {$ifndef FPC_HAS_UCHAR_TO_UNICODESTR}
- {$define FPC_HAS_UCHAR_TO_UNICODESTR}
- Function fpc_UChar_To_UnicodeStr(const c : UnicodeChar): UnicodeString; compilerproc;
- {
- Converts a UnicodeChar to a UnicodeString;
- }
- begin
- Setlength (fpc_UChar_To_UnicodeStr,1);
- fpc_UChar_To_UnicodeStr[1]:= c;
- end;
- {$endif FPC_HAS_UCHAR_TO_UNICODESTR}
- {$ifndef FPC_HAS_UCHAR_TO_ANSISTR}
- {$define FPC_HAS_UCHAR_TO_ANSISTR}
- Function fpc_UChar_To_AnsiStr(const c : UnicodeChar{$ifdef FPC_HAS_CPSTRING};cp : TSystemCodePage{$endif FPC_HAS_CPSTRING}): AnsiString; compilerproc;
- {
- Converts a UnicodeChar to a AnsiString;
- }
- {$ifndef FPC_HAS_CPSTRING}
- var
- cp : TSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- begin
- {$ifndef FPC_HAS_CPSTRING}
- cp:=DefaultSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- cp:=TranslatePlaceholderCP(cp);
- widestringmanager.Unicode2AnsiMoveProc(@c, fpc_UChar_To_AnsiStr, cp, 1);
- end;
- {$endif FPC_HAS_UCHAR_TO_ANSISTR}
- {$ifndef FPC_HAS_PCHAR_TO_UNICODESTR}
- {$define FPC_HAS_PCHAR_TO_UNICODESTR}
- Function fpc_PChar_To_UnicodeStr(const p : PAnsiChar): UnicodeString; compilerproc;
- Var
- L : SizeInt;
- begin
- if (not assigned(p)) or (p[0]=#0) Then
- begin
- fpc_pchar_to_unicodestr := '';
- exit;
- end;
- l:=IndexChar(p^,-1,#0);
- widestringmanager.Ansi2UnicodeMoveProc(P,DefaultSystemCodePage,fpc_PChar_To_UnicodeStr,l);
- end;
- {$endif FPC_HAS_PCHAR_TO_UNICODESTR}
- {$ifndef FPC_HAS_CHARARRAY_TO_UNICODESTR}
- {$define FPC_HAS_CHARARRAY_TO_UNICODESTR}
- Function fpc_CharArray_To_UnicodeStr(const arr: array of ansichar; zerobased: boolean = true): UnicodeString; compilerproc;
- var
- i : SizeInt;
- begin
- if zerobased then
- begin
- if arr[0]=#0 Then
- begin
- fpc_chararray_to_unicodestr:='';
- exit;
- end;
- i:=IndexChar(arr,high(arr)+1,#0);
- if i=-1 then
- i:=high(arr)+1;
- end
- else
- i:=high(arr)+1;
- widestringmanager.Ansi2UnicodeMoveProc(pansichar(@arr),DefaultSystemCodePage,fpc_CharArray_To_UnicodeStr,i);
- end;
- {$endif FPC_HAS_CHARARRAY_TO_UNICODESTR}
- {$ifndef FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
- {$define FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
- Function fpc_WideCharArray_To_UnicodeStr(const arr: array of widechar; zerobased: boolean = true): UnicodeString; compilerproc;
- var
- i : SizeInt;
- begin
- if (zerobased) then
- begin
- i:=IndexWord(arr,high(arr)+1,0);
- if i = -1 then
- i := high(arr)+1;
- end
- else
- i := high(arr)+1;
- SetLength(fpc_WideCharArray_To_UnicodeStr,i);
- Move(arr[0], Pointer(fpc_WideCharArray_To_UnicodeStr)^,i*sizeof(WideChar));
- end;
- {$endif FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
- {$ifndef FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
- {$define FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
- { due to their names, the following procedures should be in wstrings.inc,
- however, the compiler generates code using this functions on all platforms }
- procedure fpc_WideCharArray_To_ShortStr(out res : shortstring;const arr: array of widechar; zerobased: boolean = true);[public,alias:'FPC_WIDECHARARRAY_TO_SHORTSTR']; compilerproc;
- var
- l: longint;
- index: ptrint;
- len: byte;
- temp: ansistring;
- begin
- l := high(arr)+1;
- if l>=high(res)+1 then
- l:=high(res)
- else if l<0 then
- l:=0;
- if zerobased then
- begin
- index:=IndexWord(arr[0],l,0);
- if index<0 then
- len:=l
- else
- len:=index;
- end
- else
- len:=l;
- widestringmanager.Wide2AnsiMoveProc (pwidechar(@arr),temp,DefaultSystemCodePage,len);
- res:=temp;
- end;
- {$endif FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
- {$ifndef FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
- {$define FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
- Function fpc_WideCharArray_To_AnsiStr(const arr: array of widechar; {$ifdef FPC_HAS_CPSTRING}cp : TSystemCodePage;{$endif FPC_HAS_CPSTRING} zerobased: boolean = true): AnsiString; compilerproc;
- var
- i : SizeInt;
- {$ifndef FPC_HAS_CPSTRING}
- cp : TSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- begin
- {$ifndef FPC_HAS_CPSTRING}
- cp:=DefaultSystemCodePage;
- {$endif FPC_HAS_CPSTRING}
- if (zerobased) then
- begin
- i:=IndexWord(arr,high(arr)+1,0);
- if i = -1 then
- i := high(arr)+1;
- end
- else
- i := high(arr)+1;
- if i > 0 then
- begin
- cp:=TranslatePlaceholderCP(cp);
- widestringmanager.Wide2AnsiMoveProc (pwidechar(@arr),RawByteString(fpc_WideCharArray_To_AnsiStr),cp,i);
- end
- else
- fpc_WideCharArray_To_AnsiStr:='';
- end;
- {$endif FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
- {$ifndef FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
- {$define FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
- Function fpc_WideCharArray_To_WideStr(const arr: array of widechar; zerobased: boolean = true): WideString; compilerproc;
- var
- i : SizeInt;
- begin
- if (zerobased) then
- begin
- i:=IndexWord(arr,high(arr)+1,0);
- if i = -1 then
- i := high(arr)+1;
- end
- else
- i := high(arr)+1;
- SetLength(fpc_WideCharArray_To_WideStr,i);
- Move(arr[0], Pointer(fpc_WideCharArray_To_WideStr)^,i*sizeof(WideChar));
- end;
- {$endif FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
- {$ifndef FPC_HAS_UNICODESTR_TO_CHARARRAY}
- {$define FPC_HAS_UNICODESTR_TO_CHARARRAY}
- procedure fpc_unicodestr_to_chararray(out res: array of AnsiChar; const src: UnicodeString); compilerproc;
- var
- len: SizeInt;
- temp: ansistring;
- begin
- len := length(src);
- { make sure we don't dereference src if it can be nil (JM) }
- if len > 0 then
- widestringmanager.unicode2ansimoveproc(punicodechar(@src[1]),temp,DefaultSystemCodePage,len);
- len := length(temp);
- if len > length(res) then
- len := length(res);
- {$push}
- {$r-}
- move(temp[1],res[0],len);
- fillchar(res[len],length(res)-len,0);
- {$pop}
- end;
- {$endif FPC_HAS_UNICODESTR_TO_UNICODECHARARRAY}
- {$ifndef FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
- {$define FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
- procedure fpc_ansistr_to_widechararray(out res: array of widechar; const src: RawByteString); compilerproc;
- var
- len: SizeInt;
- temp: widestring;
- begin
- len := length(src);
- { make sure we don't dereference src if it can be nil (JM) }
- if len > 0 then
- widestringmanager.ansi2widemoveproc(pansichar(@src[1]),TranslatePlaceholderCP(StringCodePage(src)),temp,len);
- len := length(temp);
- if len > length(res) then
- len := length(res);
- {$push}
- {$r-}
- move(temp[1],res[0],len*sizeof(widechar));
- fillchar(res[len],(length(res)-len)*SizeOf(WideChar),0);
- {$pop}
- end;
- {$endif FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
- {$ifndef FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
- {$define FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
- procedure fpc_shortstr_to_widechararray(out res: array of widechar; const src: ShortString); compilerproc;
- var
- len: longint;
- temp : widestring;
- begin
- len := length(src);
- { make sure we don't access AnsiChar 1 if length is 0 (JM) }
- if len > 0 then
- widestringmanager.ansi2widemoveproc(pansichar(@src[1]),DefaultSystemCodePage,temp,len);
- len := length(temp);
- if len > length(res) then
- len := length(res);
- {$push}
- {$r-}
- move(temp[1],res[0],len*sizeof(widechar));
- fillchar(res[len],(length(res)-len)*SizeOf(WideChar),0);
- {$pop}
- end;
- {$endif FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
- {$ifndef FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
- {$define FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
- procedure fpc_unicodestr_to_widechararray(out res: array of widechar; const src: UnicodeString); compilerproc;
- var
- len: SizeInt;
- begin
- len := length(src);
- if len > length(res) then
- len := length(res);
- {$push}
- {$r-}
- { make sure we don't try to access element 1 of the widestring if it's nil }
- if len > 0 then
- move(src[1],res[0],len*SizeOf(WideChar));
- fillchar(res[len],(length(res)-len)*SizeOf(WideChar),0);
- {$pop}
- end;
- {$endif FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
- {$ifndef FPC_HAS_UNICODESTR_COMPARE}
- {$define FPC_HAS_UNICODESTR_COMPARE}
- Function fpc_UnicodeStr_Compare(const S1,S2 : UnicodeString): SizeInt;[Public,Alias : 'FPC_UNICODESTR_COMPARE']; compilerproc;
- {
- Compares 2 UnicodeStrings;
- The result is
- <0 if S1<S2
- 0 if S1=S2
- >0 if S1>S2
- }
- Var
- MaxI,Temp : SizeInt;
- begin
- if pointer(S1)=pointer(S2) then
- begin
- fpc_UnicodeStr_Compare:=0;
- exit;
- end;
- Maxi:=Length(S1);
- temp:=Length(S2);
- If MaxI>Temp then
- MaxI:=Temp;
- Temp:=CompareWord(S1[1],S2[1],MaxI);
- if temp=0 then
- temp:=Length(S1)-Length(S2);
- fpc_UnicodeStr_Compare:=Temp;
- end;
- {$endif FPC_HAS_UNICODESTR_COMPARE}
- {$ifndef FPC_HAS_UNICODESTR_COMPARE_EQUAL}
- {$define FPC_HAS_UNICODESTR_COMPARE_EQUAL}
- Function fpc_UnicodeStr_Compare_Equal(const S1,S2 : UnicodeString): SizeInt;[Public,Alias : 'FPC_UNICODESTR_COMPARE_EQUAL']; compilerproc;
- {
- Compares 2 UnicodeStrings for equality only;
- The result is
- 0 if S1=S2
- <>0 if S1<>S2
- }
- Var
- MaxI : SizeInt;
- begin
- if pointer(S1)=pointer(S2) then
- exit(0);
- Maxi:=Length(S1);
- If MaxI<>Length(S2) then
- exit(-1)
- else
- exit(CompareWord(S1[1],S2[1],MaxI));
- end;
- {$endif FPC_HAS_UNICODESTR_COMPARE_EQUAL}
- {$ifndef FPC_HAS_UNICODESTR_RANGECHECK}
- {$define FPC_HAS_UNICODESTR_RANGECHECK}
- Procedure fpc_UnicodeStr_RangeCheck(p: Pointer; index: SizeInt);[Public,Alias : 'FPC_UNICODESTR_RANGECHECK']; compilerproc;
- begin
- if (p=nil) or (index>PUnicodeRec(p-UnicodeFirstOff)^.len) or (Index<1) then
- HandleErrorAddrFrameInd(201,get_pc_addr,get_frame);
- end;
- Procedure fpc_UnicodeStr_ZeroBased_RangeCheck(p: Pointer; index: SizeInt);[Public,Alias : 'FPC_UNICODESTR_ZEROBASED_RANGECHECK']; compilerproc;
- begin
- if (p=nil) or (index>=PUnicodeRec(p-UnicodeFirstOff)^.len) or (Index<0) then
- HandleErrorAddrFrameInd(201,get_pc_addr,get_frame);
- end;
- {$endif FPC_HAS_UNICODESTR_RANGECHECK}
- {$ifndef FPC_HAS_UNICODESTR_SETLENGTH}
- {$define FPC_HAS_UNICODESTR_SETLENGTH}
- Procedure fpc_UnicodeStr_SetLength(Var S : UnicodeString; l : SizeInt);[Public,Alias : 'FPC_UNICODESTR_SETLENGTH']; compilerproc;
- {
- Sets The length of string S to L.
- Makes sure S is unique, and contains enough room.
- }
- Var
- Temp : Pointer;
- lens, lena : SizeUInt;
- begin
- if (l>0) then
- begin
- if Pointer(S)=nil then
- begin
- { Need a complete new string...}
- Pointer(s):=NewUnicodeString(l);
- end
- else
- if (PUnicodeRec(Pointer(S)-UnicodeFirstOff)^.Ref = 1) then
- begin
- Temp:=Pointer(s)-UnicodeFirstOff;
- lens:=MemSize(Temp);
- lena:=SizeUInt(L*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar)));
- if (lena>lens) or ((lens>32) and (lena<=SizeInt(SizeUint(lens) div 2))) then
- Pointer(S):=reallocmem(Temp, lena)+UnicodeFirstOff;
- end
- else
- begin
- { Reallocation is needed... }
- Temp:=NewUnicodeString(l);
- { also move terminating null }
- lens:=PUnicodeRec(Pointer(S)-UnicodeFirstOff)^.Len+1;
- if l<lens then
- lens:=l;
- Move(Pointer(S)^,Temp^,lens * Sizeof(UnicodeChar));
- fpc_unicodestr_decr_ref(Pointer(S));
- Pointer(S):=Temp;
- end;
- { Force nil termination in case it gets shorter }
- PWord(Pointer(S)+l*sizeof(UnicodeChar))^:=0;
- PUnicodeRec(Pointer(S)-UnicodeFirstOff)^.Len:=l;
- end
- else { length=0, deallocate the string }
- fpc_unicodestr_decr_ref (Pointer(S));
- end;
- {$endif FPC_HAS_UNICODESTR_SETLENGTH}
- {*****************************************************************************
- Public functions, In interface.
- *****************************************************************************}
- function UnicodeCharToString(S : PUnicodeChar) : UnicodeString;
- begin
- result:=UnicodeCharLenToString(s,Length(UnicodeString(s)));
- end;
- {$ifndef FPC_HAS_STRING_TO_UNICODECHAR}
- {$define FPC_HAS_STRING_TO_UNICODECHAR}
- function StringToUnicodeChar(const Src : RawByteString;Dest : PUnicodeChar;DestSize : SizeInt) : PUnicodeChar;
- begin
- result:=StringToWideChar(Src,Dest,DestSize);
- end;
- {$endif FPC_HAS_STRING_TO_UNICODECHAR}
- function WideCharToString(S : PWideChar) : UnicodeString;
- begin
- result:=WideCharLenToString(s,Length(WideString(s)));
- end;
- {$ifndef FPC_HAS_STRING_LEN_TO_WIDECHAR}
- {$define FPC_HAS_STRING_LEN_TO_WIDECHAR}
- function StringToWideChar(const Src : RawByteString;Dest : PWideChar;DestSize : SizeInt) : PWideChar;
- var
- temp: widestring;
- Len: SizeInt;
- begin
- widestringmanager.Ansi2WideMoveProc(PAnsiChar(Src),StringCodePage(Src),temp,Length(Src));
- Len:=Length(temp);
- if DestSize<=Len then
- Len:=Destsize-1;
- move(temp[1],Dest^,Len*SizeOf(WideChar));
- Dest[Len]:=#0;
- result:=Dest;
- end;
- {$endif FPC_HAS_STRING_LEN_TO_WIDECHAR}
- {$ifndef FPC_HAS_UNICODEFROMLOCALECHARS}
- {$define FPC_HAS_UNICODEFROMLOCALECHARS}
- function UnicodeFromLocaleChars(CodePage, Flags: Cardinal; LocaleStr: PAnsiChar;
- LocaleStrLen: Integer; UnicodeStr: PWideChar; UnicodeStrLen: Integer): Integer; overload;
- var
- temp: widestring;
- Len: SizeInt;
- begin
- widestringmanager.Ansi2WideMoveProc(LocaleStr,CodePage,temp,LocaleStrLen);
- Len:=Length(temp);
- // Only move when we have room.
- if (UnicodeStrLen>0) then
- begin
- if UnicodeStrLen<=Len then
- Len:=UnicodeStrLen-1;
- move(temp[1],UnicodeStr^,Len*SizeOf(WideChar));
- UnicodeStr[Len]:=#0;
- end;
- // Return length
- result:=len;
- end;
- {$endif ndef FPC_HAS_UNICODEFROMLOCALECHARS}
- function UnicodeFromLocaleChars(const LocaleName: AnsiString; Flags: Cardinal;
- LocaleStr: PAnsiChar; LocaleStrLen: Integer; UnicodeStr: PWideChar;
- UnicodeStrLen: Integer): Integer; overload;
- var
- CP : TSystemCodePage;
- begin
- if not LocaleNameToCodePage(LocaleName,CP) then
- Result:=0
- else
- Result:=UnicodeFromLocaleChars(CP,Flags,LocaleStr,LocaleStrLen,UnicodeStr,UnicodeStrLen);
- end;
- {$ifndef FPC_HAS_UNICODECHAR_LEN_TO_STRING}
- {$define FPC_HAS_UNICODECHAR_LEN_TO_STRING}
- function UnicodeCharLenToString(S : PUnicodeChar;Len : SizeInt) : UnicodeString;
- begin
- SetLength(result,Len);
- Move(S^,Pointer(Result)^,Len*2);
- end;
- {$endif FPC_HAS_UNICODECHAR_LEN_TO_STRING}
- procedure UnicodeCharLenToStrVar(Src : PUnicodeChar;Len : SizeInt;out Dest : UnicodeString);
- begin
- Dest:=UnicodeCharLenToString(Src,Len);
- end;
- procedure UnicodeCharLenToStrVar(Src : PUnicodeChar;Len : SizeInt;out Dest : AnsiString);
- begin
- Dest:=AnsiString(UnicodeCharLenToString(Src,Len));
- end;
- procedure UnicodeCharToStrVar(S : PUnicodeChar;out Dest : AnsiString);
- begin
- Dest:=AnsiString(UnicodeCharToString(S));
- end;
- {$ifndef FPC_HAS_WIDECHAR_LEN_TO_STRING}
- {$define FPC_HAS_WIDECHAR_LEN_TO_STRING}
- function WideCharLenToString(S : PWideChar;Len : SizeInt) : UnicodeString;
- begin
- SetLength(result,Len);
- Move(S^,Pointer(Result)^,Len*2);
- end;
- {$endif FPC_HAS_WIDECHAR_LEN_TO_STRING}
- procedure WideCharLenToStrVar(Src : PWideChar;Len : SizeInt;out Dest : UnicodeString);
- begin
- Dest:=WideCharLenToString(Src,Len);
- end;
- procedure WideCharLenToStrVar(Src : PWideChar;Len : SizeInt;out Dest : AnsiString);
- begin
- Dest:=AnsiString(WideCharLenToString(Src,Len));
- end;
- procedure WideCharToStrVar(S : PWideChar;out Dest : UnicodeString);
- begin
- Dest:=WideCharToString(S);
- end;
- procedure WideCharToStrVar(S : PWideChar;out Dest : AnsiString);
- begin
- Dest:=AnsiString(WideCharToString(S));
- end;
- Function fpc_unicodestr_Unique_func(Var S : UnicodeString): Pointer; external name 'FPC_UNICODESTR_UNIQUE';
- Procedure UniqueString (Var S : UnicodeString);{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- fpc_unicodestr_Unique_func(S);
- end;
- {$ifndef FPC_HAS_UNICODESTR_UNIQUE}
- {$define FPC_HAS_UNICODESTR_UNIQUE}
- Function fpc_unicodestr_Unique(Var S : Pointer): Pointer; [Public,Alias : 'FPC_UNICODESTR_UNIQUE']; compilerproc;
- {
- Make sure reference count of S is 1,
- using copy-on-write semantics.
- }
- Var
- SNew : Pointer;
- L : SizeInt;
- begin
- pointer(result) := pointer(s);
- If (result<>nil) and (PUnicodeRec(result-UnicodeFirstOff)^.Ref<>1) then
- begin
- L:=PUnicodeRec(Pointer(S)-UnicodeFirstOff)^.len;
- SNew:=NewUnicodeString (L);
- Move (PUnicodeChar(S)^,SNew^,(L+1)*sizeof(UnicodeChar));
- PUnicodeRec(SNew-UnicodeFirstOff)^.len:=L;
- fpc_unicodestr_decr_ref (Pointer(S)); { Thread safe }
- pointer(S):=SNew;
- pointer(result):=SNew;
- end;
- end;
- {$endif FPC_HAS_UNICODESTR_UNIQUE}
- {$ifndef FPC_HAS_UNICODESTR_COPY}
- {$define FPC_HAS_UNICODESTR_COPY}
- Function Fpc_UnicodeStr_Copy (Const S : UnicodeString; Index,Size : SizeInt) : UnicodeString;compilerproc;
- var
- Lim : SizeInt;
- ResultAddress : Pointer;
- begin
- ResultAddress:=Nil;
- dec(index);
- if Index < 0 then
- Index := 0;
- Lim:=Length(S)-Index; { Cannot overflow as both Length(S) and Index are non-negative. }
- if Size>Lim then
- Size:=Lim;
- If Size>0 then
- begin
- ResultAddress:=NewUnicodeString(Size);
- Move (PUnicodeChar(S)[Index],ResultAddress^,Size*sizeof(UnicodeChar));
- PUnicodeRec(ResultAddress-UnicodeFirstOff)^.Len:=Size;
- PUnicodeChar(ResultAddress+Size*sizeof(UnicodeChar))^:=#0;
- end;
- fpc_unicodestr_decr_ref(Pointer(fpc_unicodestr_copy));
- Pointer(fpc_unicodestr_Copy):=ResultAddress;
- end;
- {$endif FPC_HAS_UNICODESTR_COPY}
- {$ifndef FPC_HAS_POS_UNICODESTR_UNICODESTR}
- {$define FPC_HAS_POS_UNICODESTR_UNICODESTR}
- Function Pos (Const Substr : UnicodeString; Const Source : UnicodeString; Offset: Sizeint = 1) : SizeInt;
- var
- i,MaxLen,nsource,nsub,d : SizeInt;
- begin
- Pos:=0;
- nsource:=Length(Source);
- nsub:=Length(Substr);
- if (nsub>0) and (Offset>0) and (Offset<=nsource) then
- begin
- MaxLen:=nsource-nsub+1;
- i:=Offset;
- while (i<=MaxLen) do
- begin
- d:=IndexWord(Source[i],MaxLen-i+1,word(Substr[1]));
- if d<0 then
- exit;
- if CompareWord(Substr[1],Source[i+d],nsub)=0 then
- exit(i+d);
- i:=i+d+1;
- end;
- end;
- end;
- {$endif FPC_HAS_POS_UNICODESTR_UNICODESTR}
- {$ifndef FPC_HAS_POS_UNICODECHAR_UNICODESTR}
- {$define FPC_HAS_POS_UNICODECHAR_UNICODESTR}
- { Faster version for a unicodechar alone }
- Function Pos (c : UnicodeChar; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
- var
- ns,idx: SizeInt;
- begin
- pos:=0;
- ns:=length(s);
- if (Offset>0) and (Offset<=ns) then
- begin
- idx:=IndexWord(s[Offset],ns-Offset+1,word(c));
- if idx>=0 then
- pos:=Offset+idx;
- end;
- end;
- {$endif FPC_HAS_POS_UNICODECHAR_UNICODESTR}
- { DO NOT inline these! Inlining a managed typecast creates an implicit try..finally
- block, which is significant bloat without any sensible speed improvement. }
- Function Pos (const c : RawByteString; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
- begin
- result:=Pos(UnicodeString(c),s,offset);
- end;
- Function Pos (const c : ShortString; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
- begin
- result:=Pos(UnicodeString(c),s,OffSet);
- end;
- Function Pos (const c : UnicodeString; Const s : RawByteString; Offset: Sizeint = 1) : SizeInt;
- begin
- result:=Pos(c,UnicodeString(s),OffSet);
- end;
- {$ifndef FPC_HAS_UNICODESTR_OF_CHAR}
- {$define FPC_HAS_UNICODESTR_OF_CHAR}
- Function StringOfChar(c : Unicodechar;l : SizeInt) : UnicodeString;
- begin
- SetLength(StringOfChar,l);
- FillWord(Pointer(StringOfChar)^,Length(StringOfChar),word(c));
- end;
- {$endif}
- {$ifndef FPC_HAS_POS_CHAR_UNICODESTR}
- {$define FPC_HAS_POS_CHAR_UNICODESTR}
- { Faster version for a AnsiChar alone. Must be implemented because }
- { pos(c: AnsiChar; const s: shortstring) also exists, so otherwise }
- { using pos(AnsiChar,pansichar) will always call the shortstring version }
- { (exact match for first argument), also with $h+ (JM) }
- Function Pos (c : AnsiChar; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
- var
- ns,idx: SizeInt;
- begin
- pos:=0;
- ns:=length(s);
- if (Offset>0) and (Offset<=ns) then
- begin
- idx:=IndexWord(s[Offset],ns-Offset+1,word(unicodechar(c)));
- if idx>=0 then
- pos:=Offset+idx;
- end;
- end;
- {$endif FPC_HAS_POS_CHAR_UNICODESTR}
- {$ifndef FPC_HAS_DELETE_UNICODESTR}
- {$define FPC_HAS_DELETE_UNICODESTR}
- Procedure {$ifdef VER3_0}Delete{$else}fpc_unicodestr_delete{$endif}(Var S : UnicodeString; Index,Size: SizeInt);
- Var
- LS : SizeInt;
- begin
- LS:=Length(S);
- if (Index>LS) or (Index<=0) or (Size<=0) then
- exit;
- UniqueString (S);
- { (Size+Index) will overflow if Size=MaxInt. }
- if Size>LS-Index then
- Size:=LS-Index+1;
- if Size<=LS-Index then
- begin
- Dec(Index);
- Move(PUnicodeChar(S)[Index+Size],PUnicodeChar(S)[Index],(LS-Index-Size+1)*sizeof(UnicodeChar));
- end;
- Setlength(s,LS-Size);
- end;
- {$endif FPC_HAS_DELETE_UNICODESTR}
- {$ifndef FPC_HAS_INSERT_UNICODESTR}
- {$define FPC_HAS_INSERT_UNICODESTR}
- Procedure {$ifdef VER3_0}Insert{$else}fpc_unicodestr_insert{$endif}(Const Source : UnicodeString; Var S : UnicodeString; Index : SizeInt);
- var
- Temp : UnicodeString;
- LS : SizeInt;
- begin
- If Length(Source)=0 then
- exit;
- if index <= 0 then
- index := 1;
- Ls:=Length(S);
- if index > LS then
- index := LS+1;
- Dec(Index);
- SetLength(Temp,Length(Source)+LS);
- If Index>0 then
- move (PUnicodeChar(S)^,PUnicodeChar(Temp)^,Index*sizeof(UnicodeChar));
- Move (PUnicodeChar(Source)^,PUnicodeChar(Temp)[Index],Length(Source)*sizeof(UnicodeChar));
- If (LS-Index)>0 then
- Move(PUnicodeChar(S)[Index],PUnicodeChar(temp)[Length(Source)+index],(LS-Index)*sizeof(UnicodeChar));
- S:=Temp;
- end;
- {$endif FPC_HAS_INSERT_UNICODESTR}
- {$ifndef FPC_HAS_UPCASE_UNICODECHAR}
- {$define FPC_HAS_UPCASE_UNICODECHAR}
- Function UpCase(c:UnicodeChar):UnicodeChar;
- begin
- Result:= widestringmanager.UpperUnicodeStringProc(UnicodeString(c))[1]
- end;
- {$endif FPC_HAS_UPCASE_UNICODECHAR}
- {$ifndef FPC_HAS_UPCASE_UNICODESTR}
- {$define FPC_HAS_UPCASE_UNICODESTR}
- function UpCase(const s : UnicodeString) : UnicodeString;
- begin
- result:=widestringmanager.UpperUnicodeStringProc(s);
- end;
- {$endif FPC_HAS_UPCASE_UNICODESTR}
- {$ifndef FPC_HAS_LOWERCASE_UNICODECHAR}
- {$define FPC_HAS_LOWERCASE_UNICODECHAR}
- Function LowerCase(c:UnicodeChar):UnicodeChar;
- begin
- Result:= widestringmanager.LowerUnicodeStringProc(UnicodeString(c))[1]
- end;
- {$endif FPC_HAS_LOWERCASE_UNICODECHAR}
- {$ifndef FPC_HAS_LOWERCASE_UNICODESTR}
- {$define FPC_HAS_LOWERCASE_UNICODESTR}
- function LowerCase(const s : UnicodeString) : UnicodeString;
- begin
- result:=widestringmanager.LowerUnicodeStringProc(s);
- end;
- {$endif FPC_HAS_LOWERCASE_UNICODESTR}
- {$ifndef FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
- {$define FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
- Procedure {$ifdef FPC_HAS_CPSTRING}fpc_setstring_unicodestr_pwidechar{$else}SetString{$endif}(Out S : UnicodeString; Buf : PUnicodeChar; Len : SizeInt); {$ifdef FPC_HAS_CPSTRING} compilerproc; {$endif FPC_HAS_CPSTRING}
- begin
- SetLength(S,Len);
- If (Buf<>Nil) and (Len>0) then
- Move (Buf[0],S[1],Len*sizeof(UnicodeChar));
- end;
- {$endif FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
- {$ifndef FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
- {$define FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
- Procedure {$ifdef FPC_HAS_CPSTRING}fpc_setstring_unicodestr_pansichar{$else}SetString{$endif}(Out S : UnicodeString; Buf : PAnsiChar; Len : SizeInt); {$ifdef FPC_HAS_CPSTRING} compilerproc; {$endif FPC_HAS_CPSTRING}
- begin
- If (Buf<>Nil) and (Len>0) then
- widestringmanager.Ansi2UnicodeMoveProc(Buf,DefaultSystemCodePage,S,Len)
- else
- SetLength(S,Len);
- end;
- {$endif FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
- {$ifndef FPUNONE}
- Function fpc_Val_Real_UnicodeStr(Const S : UnicodeString; out Code : ValSInt): ValReal; [public, alias:'FPC_VAL_REAL_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_Real_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_Real_UnicodeStr,code);
- end;
- end;
- {$endif}
- {$ifndef FPC_STR_ENUM_INTERN}
- function fpc_val_enum_unicodestr(str2ordindex:pointer;const s:unicodestring;out code:valsint):longint;compilerproc;
- var
- ss: ShortString;
- begin
- if length(s)>255 then
- code:=256
- else
- begin
- ss:=ShortString(s);
- val(ss,fpc_val_enum_unicodestr,code);
- end;
- end;
- {$endif FPC_STR_ENUM_INTERN}
- Function fpc_Val_Currency_UnicodeStr(Const S : UnicodeString; out Code : ValSInt): Currency; [public, alias:'FPC_VAL_CURRENCY_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- if length(S)>255 then
- begin
- fpc_Val_Currency_UnicodeStr:=0;
- code:=256;
- end
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_Currency_UnicodeStr,code);
- end;
- end;
- Function fpc_Val_UInt_UnicodeStr ({$ifndef VER3_2}DestSize: SizeInt;{$endif VER3_2} Const S : UnicodeString; out Code : ValSInt): ValUInt; [public, alias:'FPC_VAL_UINT_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_UInt_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_UInt_UnicodeStr,code);
- end;
- end;
- Function fpc_Val_SInt_UnicodeStr (DestSize: SizeInt; Const S : UnicodeString; out Code : ValSInt): ValSInt; [public, alias:'FPC_VAL_SINT_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_SInt_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- fpc_Val_SInt_UnicodeStr := int_Val_SInt_ShortStr(DestSize,SS,Code);
- end;
- end;
- {$ifndef CPU64}
- Function fpc_Val_qword_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): qword; [public, alias:'FPC_VAL_QWORD_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_qword_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_qword_UnicodeStr,Code);
- end;
- end;
- Function fpc_Val_int64_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): Int64; [public, alias:'FPC_VAL_INT64_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_int64_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_int64_UnicodeStr,Code);
- end;
- end;
- {$endif CPU64}
- {$if defined(CPU16) or defined(CPU8)}
- Function fpc_Val_longword_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): longword; [public, alias:'FPC_VAL_LONGWORD_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_longword_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_longword_UnicodeStr,Code);
- end;
- end;
- Function fpc_Val_longint_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): LongInt; [public, alias:'FPC_VAL_LONGINT_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_longint_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_longint_UnicodeStr,Code);
- end;
- end;
- Function fpc_Val_word_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): word; [public, alias:'FPC_VAL_WORD_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_word_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_word_UnicodeStr,Code);
- end;
- end;
- Function fpc_Val_smallint_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): SmallInt; [public, alias:'FPC_VAL_SMALLINT_UNICODESTR']; compilerproc;
- Var
- SS: ShortString;
- begin
- fpc_Val_smallint_UnicodeStr:=0;
- if length(S)>255 then
- code:=256
- else
- begin
- SS:=ShortString(S);
- Val(SS,fpc_Val_smallint_UnicodeStr,Code);
- end;
- end;
- {$endif CPU16 or CPU8}
- {$ifndef FPUNONE}
- procedure fpc_UnicodeStr_Float(d : ValReal;len,fr,rt : SizeInt;out s : UnicodeString);compilerproc;
- var
- ss: shortstring;
- begin
- str_real(len,fr,d,treal_type(rt),ss);
- s:=UnicodeString(ss);
- end;
- {$endif}
- {$ifndef FPC_STR_ENUM_INTERN}
- procedure fpc_unicodestr_enum(ordinal,len:sizeint;typinfo,ord2strindex:pointer;out s:unicodestring);compilerproc;
- var
- ss: ShortString;
- begin
- fpc_shortstr_enum(ordinal,len,typinfo,ord2strindex,ss);
- s:=UnicodeString(ss);
- end;
- {$endif FPC_STR_ENUM_INTERN}
- procedure fpc_unicodestr_bool(b : boolean;len:sizeint;out s:unicodestring);compilerproc;
- var
- ss: ShortString;
- begin
- fpc_shortstr_bool(b,len,ss);
- s:=UnicodeString(ss);
- end;
- procedure fpc_UnicodeStr_Currency(c : Currency;len,fr : SizeInt;out s : UnicodeString);compilerproc;
- var
- ss: shortstring;
- begin
- str(c:len:fr,ss);
- s:=UnicodeString(ss);
- end;
- Procedure fpc_UnicodeStr_SInt(v : ValSint; Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- Str (v:Len,SS);
- S:=UnicodeString(SS);
- end;
- Procedure fpc_UnicodeStr_UInt(v : ValUInt;Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- str(v:Len,SS);
- S:=UnicodeString(SS);
- end;
- {$ifndef CPU64}
- Procedure fpc_UnicodeStr_Int64(v : Int64; Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- Str (v:Len,SS);
- S:=UnicodeString(SS);
- end;
- Procedure fpc_UnicodeStr_Qword(v : Qword;Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- str(v:Len,SS);
- S:=UnicodeString(SS);
- end;
- {$endif CPU64}
- {$if defined(CPU16) or defined(CPU8)}
- Procedure fpc_UnicodeStr_LongInt(v : LongInt; Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- Str (v:Len,SS);
- S:=UnicodeString(SS);
- end;
- Procedure fpc_UnicodeStr_LongWord(v : LongWord;Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- str(v:Len,SS);
- S:=UnicodeString(SS);
- end;
- Procedure fpc_UnicodeStr_SmallInt(v : SmallInt; Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- Str (v:Len,SS);
- S:=UnicodeString(SS);
- end;
- Procedure fpc_UnicodeStr_Word(v : Word;Len : SizeInt; out S : UnicodeString);compilerproc;
- Var
- SS: ShortString;
- begin
- str(v:Len,SS);
- S:=UnicodeString(SS);
- end;
- {$endif CPU16 or CPU8}
- function UnicodeToUtf8(Dest: PAnsiChar; Source: PUnicodeChar; MaxBytes: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- if assigned(Source) then
- Result:=UnicodeToUtf8(Dest,MaxBytes,Source,Length(Source))
- else
- Result:=0;
- end;
- function UnicodeToUtf8(Dest: PAnsiChar; MaxDestBytes: SizeUInt; Source: PUnicodeChar; SourceChars: SizeUInt): SizeUInt;
- {$ifdef EXCLUDE_COMPLEX_PROCS}
- begin
- runerror(217);
- end;
- {$else EXCLUDE_COMPLEX_PROCS}
- var
- i,j : SizeUInt;
- lw : longword;
- begin
- result:=0;
- if source=nil then
- exit;
- i:=0;
- j:=0;
- if assigned(Dest) then
- begin
- while (i<SourceChars) and (j<MaxDestBytes) do
- begin
- lw:=ord(Source[i]);
- case lw of
- 0..$7f:
- begin
- Dest[j]:=AnsiChar(lw);
- inc(j);
- end;
- $80..$7ff:
- begin
- if j+1>=MaxDestBytes then
- break;
- Dest[j]:=AnsiChar($c0 or (lw shr 6));
- Dest[j+1]:=AnsiChar($80 or (lw and $3f));
- inc(j,2);
- end;
- $800..$d7ff,$e000..$ffff:
- begin
- if j+2>=MaxDestBytes then
- break;
- Dest[j]:=AnsiChar($e0 or (lw shr 12));
- Dest[j+1]:=AnsiChar($80 or ((lw shr 6) and $3f));
- Dest[j+2]:=AnsiChar($80 or (lw and $3f));
- inc(j,3);
- end;
- $d800..$dbff:
- {High Surrogates}
- begin
- if j+3>=MaxDestBytes then
- break;
- if (i+1<sourcechars) and
- (word(Source[i+1]) >= $dc00) and
- (word(Source[i+1]) <= $dfff) then
- begin
- { $d7c0 is ($d800 - ($10000 shr 10)) }
- lw:=(longword(lw-$d7c0) shl 10) + (ord(source[i+1]) xor $dc00);
- Dest[j]:=AnsiChar($f0 or (lw shr 18));
- Dest[j+1]:=AnsiChar($80 or ((lw shr 12) and $3f));
- Dest[j+2]:=AnsiChar($80 or ((lw shr 6) and $3f));
- Dest[j+3]:=AnsiChar($80 or (lw and $3f));
- inc(j,4);
- inc(i);
- end;
- end;
- end;
- inc(i);
- end;
- if j>SizeUInt(MaxDestBytes-1) then
- j:=MaxDestBytes-1;
- Dest[j]:=#0;
- end
- else
- begin
- while i<SourceChars do
- begin
- case word(Source[i]) of
- $0..$7f:
- inc(j);
- $80..$7ff:
- inc(j,2);
- $800..$d7ff,$e000..$ffff:
- inc(j,3);
- $d800..$dbff:
- begin
- if (i+1<sourcechars) and
- (word(Source[i+1]) >= $dc00) and
- (word(Source[i+1]) <= $dfff) then
- begin
- inc(j,4);
- inc(i);
- end;
- end;
- end;
- inc(i);
- end;
- end;
- result:=j+1;
- end;
- {$endif EXCLUDE_COMPLEX_PROCS}
- function Utf8ToUnicode(Dest: PUnicodeChar; Source: PAnsiChar; MaxChars: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- if assigned(Source) then
- Result:=Utf8ToUnicode(Dest,MaxChars,Source,length(Source),True)
- else
- Result:=0;
- end;
- function UTF8ToUnicode(Dest: PUnicodeChar; MaxDestChars: SizeUInt; Source: PAnsiChar; SourceBytes: SizeUInt): SizeUInt;{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- Result:=Utf8ToUnicode(Dest,MaxDestChars,Source,SourceBytes,True);
- end;
- function Utf8ToUnicode(Dest: PUnicodeChar; MaxDestChars: SizeUInt; Source: PAnsiChar; SourceBytes: SizeUInt; IgnoreInvalid : Boolean): SizeUInt;
- {$ifdef EXCLUDE_COMPLEX_PROCS}
- begin
- runerror(217);
- end;
- {$else EXCLUDE_COMPLEX_PROCS}
- const
- UNICODE_INVALID=63;
- var
- InputUTF8: SizeUInt;
- IBYTE: BYTE;
- OutputUnicode: SizeUInt;
- PRECHAR: SizeUInt;
- TempBYTE: BYTE;
- CharLen: SizeUint;
- LookAhead: SizeUInt;
- UC: SizeUInt;
- begin
- if not assigned(Source) then
- begin
- result:=0;
- exit;
- end;
- result:=SizeUInt(-1);
- InputUTF8:=0;
- OutputUnicode:=0;
- PreChar:=0;
- if Assigned(Dest) Then
- begin
- while (OutputUnicode<MaxDestChars) and (InputUTF8<SourceBytes) do
- begin
- IBYTE:=byte(Source[InputUTF8]);
- if (IBYTE and $80) = 0 then
- begin
- // One character US-ASCII, convert it to unicode
- // Commented code to convert LF to CRLF has been removed
- Dest[OutputUnicode]:=WideChar(IBYTE);
- inc(OutputUnicode);
- PreChar:=IBYTE;
- inc(InputUTF8);
- end
- else
- begin
- TempByte:=IBYTE;
- CharLen:=0;
- while (TempBYTE and $80)<>0 do
- begin
- TempBYTE:=(TempBYTE shl 1) and $FE;
- inc(CharLen);
- end;
- //Test for the "CharLen" conforms UTF-8 string
- //This means the 10xxxxxx pattern.
- if SizeUInt(InputUTF8+CharLen-1)>SourceBytes then
- begin
- //Insuficient chars in string to decode
- //UTF-8 array. Fallback to single AnsiChar.
- CharLen:= 1;
- end;
- for LookAhead := 1 to CharLen-1 do
- begin
- if ((byte(Source[InputUTF8+LookAhead]) and $80)<>$80) or
- ((byte(Source[InputUTF8+LookAhead]) and $40)<>$00) then
- begin
- //Invalid UTF-8 sequence, fallback.
- CharLen:= LookAhead;
- break;
- end;
- end;
- UC:=$FFFF;
- case CharLen of
- 1: begin
- //Not valid UTF-8 sequence
- UC:=UNICODE_INVALID;
- end;
- 2: begin
- //Two bytes UTF, convert it
- UC:=(byte(Source[InputUTF8]) and $1F) shl 6;
- UC:=UC or (byte(Source[InputUTF8+1]) and $3F);
- if UC <= $7F then
- begin
- //Invalid UTF sequence.
- UC:=UNICODE_INVALID;
- end;
- end;
- 3: begin
- //Three bytes, convert it to unicode
- UC:= (byte(Source[InputUTF8]) and $0F) shl 12;
- UC:= UC or ((byte(Source[InputUTF8+1]) and $3F) shl 6);
- UC:= UC or ((byte(Source[InputUTF8+2]) and $3F));
- if (UC <= $7FF) or (UC >= $FFFE) or ((UC >= $D800) and (UC <= $DFFF)) then
- begin
- //Invalid UTF-8 sequence
- UC:= UNICODE_INVALID;
- End;
- end;
- 4: begin
- //Four bytes, convert it to two unicode characters
- UC:= (byte(Source[InputUTF8]) and $07) shl 18;
- UC:= UC or ((byte(Source[InputUTF8+1]) and $3F) shl 12);
- UC:= UC or ((byte(Source[InputUTF8+2]) and $3F) shl 6);
- UC:= UC or ((byte(Source[InputUTF8+3]) and $3F));
- if (UC < $10000) or (UC > $10FFFF) then
- begin
- UC:= UNICODE_INVALID;
- end
- else
- begin
- { only store pair if room }
- dec(UC,$10000);
- if (OutputUnicode<MaxDestChars-1) then
- begin
- Dest[OutputUnicode]:=WideChar(UC shr 10 + $D800);
- inc(OutputUnicode);
- UC:=(UC and $3ff) + $DC00;
- end
- else
- begin
- InputUTF8:= InputUTF8 + CharLen;
- { don't store anything }
- CharLen:=0;
- end;
- end;
- end;
- 5,6,7: begin
- //Invalid UTF8 to unicode conversion,
- //mask it as invalid UNICODE too.
- UC:=UNICODE_INVALID;
- end;
- end;
- if CharLen > 0 then
- begin
- if (UC=UNICODE_INVALID) and Not IgnoreInvalid then
- HandleError(231); // Will be converted to EConversionError in sysutils
- PreChar:=UC;
- Dest[OutputUnicode]:=WideChar(UC);
- inc(OutputUnicode);
- end;
- InputUTF8:= InputUTF8 + CharLen;
- end;
- end;
- Result:=OutputUnicode+1;
- end
- else
- begin
- while (InputUTF8<SourceBytes) do
- begin
- IBYTE:=byte(Source[InputUTF8]);
- if (IBYTE and $80) = 0 then
- begin
- // One character US-ASCII, convert it to unicode
- // Commented code to convert LF to CRLF has been removed
- inc(OutputUnicode);
- PreChar:=IBYTE;
- inc(InputUTF8);
- end
- else
- begin
- TempByte:=IBYTE;
- CharLen:=0;
- while (TempBYTE and $80)<>0 do
- begin
- TempBYTE:=(TempBYTE shl 1) and $FE;
- inc(CharLen);
- end;
- //Test for the "CharLen" conforms UTF-8 string
- //This means the 10xxxxxx pattern.
- if SizeUInt(InputUTF8+CharLen-1)>SourceBytes then
- begin
- //Insuficient chars in string to decode
- //UTF-8 array. Fallback to single AnsiChar.
- CharLen:= 1;
- end;
- for LookAhead := 1 to CharLen-1 do
- begin
- if ((byte(Source[InputUTF8+LookAhead]) and $80)<>$80) or
- ((byte(Source[InputUTF8+LookAhead]) and $40)<>$00) then
- begin
- //Invalid UTF-8 sequence, fallback.
- CharLen:= LookAhead;
- break;
- end;
- end;
- UC:=$FFFF;
- case CharLen of
- 1: begin
- //Not valid UTF-8 sequence
- UC:=UNICODE_INVALID;
- end;
- 2: begin
- //Two bytes UTF, convert it
- UC:=(byte(Source[InputUTF8]) and $1F) shl 6;
- UC:=UC or (byte(Source[InputUTF8+1]) and $3F);
- if UC <= $7F then
- begin
- //Invalid UTF sequence.
- UC:=UNICODE_INVALID;
- end;
- end;
- 3: begin
- //Three bytes, convert it to unicode
- UC:= (byte(Source[InputUTF8]) and $0F) shl 12;
- UC:= UC or ((byte(Source[InputUTF8+1]) and $3F) shl 6);
- UC:= UC or ((byte(Source[InputUTF8+2]) and $3F));
- If (UC <= $7FF) or (UC >= $FFFE) or ((UC >= $D800) and (UC <= $DFFF)) then
- begin
- //Invalid UTF-8 sequence
- UC:= UNICODE_INVALID;
- end;
- end;
- 4: begin
- //Four bytes, convert it to two unicode characters
- UC:= (byte(Source[InputUTF8]) and $07) shl 18;
- UC:= UC or ((byte(Source[InputUTF8+1]) and $3F) shl 12);
- UC:= UC or ((byte(Source[InputUTF8+2]) and $3F) shl 6);
- UC:= UC or ((byte(Source[InputUTF8+3]) and $3F));
- if (UC < $10000) or (UC > $10FFFF) then
- UC:= UNICODE_INVALID
- else
- { extra character character }
- inc(OutputUnicode);
- end;
- 5,6,7: begin
- //Invalid UTF8 to unicode conversion,
- //mask it as invalid UNICODE too.
- UC:=UNICODE_INVALID;
- end;
- end;
- if CharLen > 0 then
- begin
- if (UC=UNICODE_INVALID) and Not IgnoreInvalid then
- HandleError(231); // Will be converted to EConversionError in sysutils
- PreChar:=UC;
- inc(OutputUnicode);
- end;
- InputUTF8:= InputUTF8 + CharLen;
- end;
- end;
- Result:=OutputUnicode+1;
- end;
- end;
- {$endif EXCLUDE_COMPLEX_PROCS}
- function UTF8Encode(const s : RawByteString) : RawByteString; inline;
- begin
- Result:=UTF8Encode(UnicodeString(s));
- end;
- {$ifndef FPC_HAS_UTF8ENCODE_UNICODESTRING}
- {$define FPC_HAS_UTF8ENCODE_UNICODESTRING}
- function UTF8Encode(const s : UnicodeString) : RawByteString;
- var
- i : SizeInt;
- hs : UTF8String;
- begin
- result:='';
- if Length(s)=0 then
- exit;
- SetLength(hs,length(s)*3);
- i:=UnicodeToUtf8(pansichar(hs),length(hs)+1,PUnicodeChar(s),length(s));
- if i>0 then
- begin
- SetLength(hs,i-1);
- result:=hs;
- end;
- end;
- {$endif FPC_HAS_UTF8ENCODE_UNICODESTRING}
- {$ifndef FPC_HAS_UTF8DECODE_UNICODESTRING}
- {$define FPC_HAS_UTF8DECODE_UNICODESTRING}
- function UTF8Decode(const s : RawByteString): UnicodeString;
- var
- i : SizeInt;
- hs : UnicodeString;
- begin
- result:='';
- if Length(s)=0 then
- exit;
- SetLength(hs,length(s));
- i:=Utf8ToUnicode(PUnicodeChar(hs),length(hs)+1,pansichar(s),length(s));
- if i>0 then
- begin
- SetLength(hs,i-1);
- result:=hs;
- end;
- end;
- {$endif FPC_HAS_UTF8DECODE_UNICODESTRING}
- function AnsiToUtf8(const s : RawByteString): RawByteString;{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- Result:=Utf8Encode(s);
- end;
- function Utf8ToAnsi(const s : RawByteString) : RawByteString;{$ifdef SYSTEMINLINE}inline;{$endif}
- begin
- Result:=RawByteString(Utf8Decode(s));
- end;
- {$ifdef FPC_HAS_FEATURE_DYNARRAYS}
- procedure UCS4Encode(p: PWideChar; len: sizeint; out res: UCS4String);
- var
- i, reslen: sizeint;
- w: longint;
- begin
- reslen:=0;
- i:=0;
- { calculate required length }
- while (i<len) do
- begin
- if (p[i]<=#$d7ff) or (p[i]>=#$e000) then
- inc(i)
- else if (p[i]<=#$dbff) and
- (i+1<len) and
- (p[i+1]>=#$dc00) and
- (p[i+1]<=#$dfff) then
- inc(i,2)
- else
- inc(i);
- inc(reslen);
- end;
- SetLength(res,reslen+1); { +1 for null termination }
- reslen:=0;
- i:=0;
- { do conversion }
- while (i<len) do
- begin
- w:=ord(p[i]);
- if (w<=$d7ff) or (w>=$e000) then
- res[reslen]:=w
- else if (w<=$dbff) and
- (i+1<len) and
- (p[i+1]>=#$dc00) and
- (p[i+1]<=#$dfff) then
- begin
- res[reslen]:=(UCS4Char(w-$d7c0) shl 10)+(UCS4Char(p[i+1]) xor $dc00);
- inc(i);
- end
- else { invalid surrogate pair }
- res[reslen]:=w;
- inc(i);
- inc(reslen);
- end;
- res[reslen]:=0;
- end;
- {$ifndef FPC_HAS_UCS4STRING_TO_UNICODESTR}
- {$define FPC_HAS_UCS4STRING_TO_UNICODESTR}
- function UnicodeStringToUCS4String(const s : UnicodeString) : UCS4String;
- begin
- UCS4Encode(PWideChar(s),Length(s),result);
- end;
- {$endif FPC_HAS_UCS4STRING_TO_UNICODESTR}
- {$ifndef FPC_HAS_WIDESTR_TO_UCS4STRING}
- {$define FPC_HAS_WIDESTR_TO_UCS4STRING}
- function WideStringToUCS4String(const s : WideString) : UCS4String;
- begin
- UCS4Encode(PWideChar(s),Length(s),result);
- end;
- {$endif FPC_HAS_WIDESTR_TO_UCS4STRING}
- {$ifndef FPC_HAS_UCS4STRING_TO_WIDESTR}
- {$define FPC_HAS_UCS4STRING_TO_WIDESTR}
- { dest should point to previously allocated wide/unicodestring }
- procedure UCS4Decode(const s: UCS4String; dest: PWideChar);
- var
- i: sizeint;
- nc: UCS4Char;
- begin
- for i:=0 to length(s)-2 do { -2 because s contains explicit terminating #0 }
- begin
- nc:=s[i];
- if (nc<=$ffff) then
- dest^:=widechar(nc)
- else if (dword(nc)<=$10ffff) then
- begin
- dest^:=widechar(nc shr 10 + $d7c0);
- { subtracting $10000 doesn't change low 10 bits }
- dest[1]:=widechar(nc and $3ff + $dc00);
- inc(dest);
- end
- else { invalid code point }
- dest^:='?';
- inc(dest);
- end;
- end;
- function UCS4StringToUnicodeString(const s : UCS4String) : UnicodeString;
- var
- i : SizeInt;
- reslen : SizeInt;
- begin
- reslen:=0;
- for i:=0 to length(s)-2 do { skip terminating #0 }
- Inc(reslen,1+ord((s[i]>$ffff) and (cardinal(s[i])<=$10ffff)));
- SetLength(result,reslen);
- UCS4Decode(s,pointer(result));
- end;
- function UCS4StringToWideString(const s : UCS4String) : WideString;
- var
- i : SizeInt;
- reslen : SizeInt;
- begin
- reslen:=0;
- for i:=0 to length(s)-2 do { skip terminating #0 }
- Inc(reslen,1+ord((s[i]>$ffff) and (cardinal(s[i])<=$10ffff)));
- SetLength(result,reslen);
- UCS4Decode(s,pointer(result));
- end;
- {$endif FPC_HAS_UCS4STRING_TO_WIDESTR}
- {$endif FPC_HAS_FEATURE_DYNARRAYS}
- {$ifndef FPC_HAS_BUILTIN_WIDESTR_MANAGER}
- const
- SNoUnicodestrings = 'This binary has no string conversion support compiled in.';
- SRecompileWithUnicodestrings = 'Recompile the application with a unit that installs a unicodestring manager in the program uses clause.';
- procedure unimplementedunicodestring;
- begin
- {$ifdef FPC_HAS_FEATURE_CONSOLEIO}
- {$ifndef HAS_WIDESTRINGMANAGER}
- {$ifndef FPC_SYSTEM_NO_VERBOSE_UNICODEERROR}
- If IsConsole then
- begin
- Writeln(StdErr,SNoUnicodestrings);
- Writeln(StdErr,SRecompileWithUnicodestrings);
- end;
- {$endif FPC_SYSTEM_NO_VERBOSE_UNICODEERROR}
- {$endif HAS_WIDESTRINGMANAGER}
- {$endif FPC_HAS_FEATURE_CONSOLEIO}
- HandleErrorAddrFrameInd(234{RuntimeErrorExitCodes[reCodesetConversion]},get_pc_addr,get_frame);
- end;
- function StringElementSize(const S: UnicodeString): Word; overload;
- begin
- if assigned(Pointer(S)) then
- Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.ElementSize
- else
- Result:=SizeOf(UnicodeChar);
- end;
- function StringRefCount(const S: UnicodeString): SizeInt; overload;
- begin
- if assigned(Pointer(S)) then
- Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.Ref
- else
- Result:=0;
- end;
- function StringCodePage(const S: UnicodeString): TSystemCodePage; overload;
- begin
- {$ifdef FPC_HAS_CPSTRING}
- if assigned(Pointer(S)) then
- Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.CodePage
- else
- {$endif FPC_HAS_CPSTRING}
- Result:=DefaultUnicodeCodePage;
- end;
- {$push}
- {$warnings off}
- function StubUnicodeCase(const s : UnicodeString) : UnicodeString;
- begin
- unimplementedunicodestring;
- end;
- function StubCompareUnicodeString(const s1, s2 : UnicodeString; Options : TCompareOptions) : PtrInt;
- begin
- unimplementedunicodestring;
- end;
- function StubWideCase(const s: WideString): WideString;
- begin
- unimplementedunicodestring;
- end;
- function StubCompareWideString(const s1, s2 : WideString; Options : TCompareOptions) : PtrInt;
- begin
- unimplementedunicodestring;
- end;
- {$pop}
- procedure initunicodestringmanager;
- begin
- {$ifndef HAS_WIDESTRINGMANAGER}
- widestringmanager:=Default(TUnicodeStringManager);
- {$ifdef FPC_WIDESTRING_EQUAL_UNICODESTRING}
- widestringmanager.Ansi2WideMoveProc:=@defaultAnsi2UnicodeMove;
- {$else FPC_WIDESTRING_EQUAL_UNICODESTRING}
- widestringmanager.Ansi2WideMoveProc:=@DefaultAnsi2WideMove;
- {$endif FPC_WIDESTRING_EQUAL_UNICODESTRING}
- widestringmanager.Wide2AnsiMoveProc:=@DefaultUnicode2AnsiMove;
- widestringmanager.UpperWideStringProc:=@StubWideCase;
- widestringmanager.LowerWideStringProc:=@StubWideCase;
- widestringmanager.Unicode2AnsiMoveProc:=@DefaultUnicode2AnsiMove;
- widestringmanager.Ansi2UnicodeMoveProc:=@DefaultAnsi2UnicodeMove;
- widestringmanager.UpperUnicodeStringProc:=@StubUnicodeCase;
- widestringmanager.LowerUnicodeStringProc:=@StubUnicodeCase;
- widestringmanager.GetStandardCodePageProc:=@DefaultGetStandardCodePage;
- {$endif HAS_WIDESTRINGMANAGER}
- widestringmanager.CompareWideStringProc:=@StubCompareWideString;
- // widestringmanager.CompareTextWideStringProc:=@StubCompareWideString;
- widestringmanager.CompareUnicodeStringProc:=@StubCompareUnicodeString;
- widestringmanager.CharLengthPCharProc:=@DefaultCharLengthPChar;
- widestringmanager.CodePointLengthProc:=@DefaultCodePointLength;
- end;
- {$endif FPC_HAS_BUILTIN_WIDESTR_MANAGER}
- {$ifndef FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
- {$define FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
- Function ToSingleByteFileSystemEncodedFileName(const Str: UnicodeString): RawByteString;
- Begin
- widestringmanager.Unicode2AnsiMoveProc(punicodechar(Str),Result,
- DefaultFileSystemCodePage,Length(Str));
- End;
- {$endif FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
- {$ifndef FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
- {$define FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
- Function ToSingleByteFileSystemEncodedFileName(const arr: array of widechar): RawByteString;
- Begin
- widestringmanager.Unicode2AnsiMoveProc(@arr[0],Result,
- DefaultFileSystemCodePage,length(pwidechar(@arr[0])));
- End;
- {$endif FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
- Function ToSingleByteFileSystemEncodedFileName(const Str: RawByteString): RawByteString;
- Begin
- Result:=Str;
- SetCodePage(Result,DefaultFileSystemCodePage,True);
- End;
- { Delphi compatibility: always interpret the data in the string as UTF-8,
- ignore any codepage }
- function UTF8ToString(const S: RawByteString): UnicodeString; inline;
- begin
- Result := UTF8Decode(S);
- end;
- function UTF8ToUnicodeString(const s : RawByteString): UnicodeString;
- begin
- Result := UTF8Decode(S);
- end;
- function UTF8ToString(const S: ShortString): UnicodeString;
- Var
- rs: RawByteString;
- begin
- rs:=S;
- Result := UTF8Decode(rs);
- end;
- function UTF8ToUnicodeString(const S: ShortString): unicodestring;
- begin
- Result:=UTF8ToString(S);
- end;
- function UTF8ToString(const S: PAnsiChar): UnicodeString;
- var
- rs: RawByteString;
- Count: Integer;
- begin
- Count := length(S);
- SetLength(rs, Count);
- if Count > 0 then
- fpc_pchar_ansistr_intern_charmove(S,0,rs,0,Count);
- Result := UTF8ToString(rs);
- end;
- function UTF8ToUnicodeString(const S: PAnsiChar): unicodestring;
- begin
- Result:=UTF8ToString(S);
- end;
- { byte and ansichar are the same on the JVM, and "array of" and "pointer to"
- are as well }
- {$ifndef CPUJVM}
- function UTF8ToString(const S: array of AnsiChar): UnicodeString;
- var
- rs: RawByteString;
- Count: Integer;
- begin
- Count := Length(S);
- SetLength(rs, Count);
- if Count > 0 then
- fpc_pchar_ansistr_intern_charmove(@S,Low(S),rs,0,Count);
- Result := UTF8ToString(rs);
- end;
- function UTF8ToString(const S: array of Byte): UnicodeString;
- var
- rs: RawByteString;
- Count: Integer;
- begin
- Count := Length(S);
- SetLength(rs, Count);
- if Count > 0 then
- fpc_pchar_ansistr_intern_charmove(pansichar(@S),Low(S),rs,0,Count);
- Result := UTF8ToString(rs);
- end;
- {$endif not CPUJVM}
- Function LocaleNameToCodePage(const localename : shortstring; out codepage : TSystemCodePage) : Boolean;
- begin
- Result:=(localename='UTF-8') or (localename='UTF8');
- if Result then
- CodePage:=CP_UTF8
- else
- begin
- Result:=(localename='UTF-7') or (localename='UTF7');
- if Result then
- CodePage:=CP_UTF7
- else
- begin
- Result:=Assigned(LocaleNameToCodePageCallBack);
- If Result then
- LocaleNameToCodePageCallBack(LocaleName,CodePage,Result);
- end;
- end;
- end;
|