2
0

ustrings.inc 67 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300
  1. {
  2. This file is part of the Free Pascal run time library.
  3. Copyright (c) 1999-2005 by Florian Klaempfl,
  4. member of the Free Pascal development team.
  5. This file implements support routines for UnicodeStrings with FPC
  6. See the file COPYING.FPC, included in this distribution,
  7. for details about the copyright.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  11. **********************************************************************}
  12. {$ifndef FPC_UNICODESTRING_TYPE_DEFINED}
  13. {$define FPC_UNICODESTRING_TYPE_DEFINED}
  14. {
  15. This file contains the implementation of the UnicodeString type,
  16. and all things that are needed for it.
  17. UnicodeString is defined as a 'silent' punicodechar :
  18. a punicodechar that points to (S= SizeOf(SizeInt), R= (if CPU64 then SizeOf(Longint) else SizeOf(SizeInt))):
  19. @-S-R : Reference count (R bytes)
  20. @-S : SizeInt for size; size=number of chars. Multiply with
  21. sizeof(UnicodeChar) to get the number of bytes. This is compatible with Delphi.
  22. @ : String + Terminating #0;
  23. Punicodechar(Unicodestring) is a valid typecast.
  24. So WS[i] is converted to the address @WS+i-1.
  25. Constants should be assigned a reference count of -1
  26. Meaning that they can't be disposed of.
  27. }
  28. Type
  { Pointer to the header record that sits in front of a UnicodeString's characters. }
  29. PUnicodeRec = ^TUnicodeRec;
  { Header of a UnicodeString. The routines in this file reach it by subtracting
    UnicodeFirstOff from the string's data pointer. }
  30. TUnicodeRec = Record
  { Code page tag; the concat routines set it to DefaultUnicodeCodePage. }
  31. CodePage : TSystemCodePage;
  { Size of one element in bytes; the concat routines set it to sizeof(UnicodeChar). }
  32. ElementSize : Word;
  { Reference count. Values below zero mark a constant string that is never freed.
    Outside VER3_2 it is a Longint on CPU64 and a SizeInt elsewhere; under VER3_2 it
    is always a SizeInt, preceded on CPU64 by a DWord of padding. }
  33. {$if not defined(VER3_2)}
  34. {$ifdef CPU64}
  35. Ref : Longint;
  36. {$else}
  37. Ref : SizeInt;
  38. {$endif}
  39. {$else}
  40. {$ifdef CPU64}
  41. { align fields }
  42. Dummy : DWord;
  43. {$endif CPU64}
  44. Ref : SizeInt;
  45. {$endif}
  { Length in characters (not bytes), excluding the terminating #0. }
  46. Len : SizeInt;
  47. end;
  48. Const
  { Byte distance from the start of the header to the first character. }
  49. UnicodeFirstOff = SizeOf(TUnicodeRec);
  50. {$endif FPC_UNICODESTRING_TYPE_DEFINED}
  51. {
  52. Default UnicodeChar <-> AnsiChar conversion maps character codes below 256
  53. one-to-one; any UnicodeChar with a higher code is translated to '?'.
  54. These routines can be overridden for the Current Locale
  55. }
  56. {$ifndef FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
  57. {$define FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
  procedure DefaultUnicode2AnsiMove(source:punicodechar;var dest:RawByteString;cp : TSystemCodePage;len:SizeInt);
  {
    Fallback UnicodeChar -> AnsiChar conversion.
    Resizes dest to len characters, tags it with code page cp and copies every
    source character whose code is below 256 unchanged; any other character
    becomes '?'.
  }
  var
    remaining : SizeInt;
    target : PAnsiChar;
    code : word;
  begin
    setlength(dest,len);
    { nothing was allocated (empty result): nothing to tag or fill }
    if pointer(dest)=nil then
      exit;
    SetCodePage(dest,cp,false);
    { SetLength made dest unique, so it can be written through a raw pointer }
    target:=pointer(dest);
    remaining:=len;
    while remaining>0 do
      begin
        code:=word(source^);
        if code>=256 then
          target^:='?'
        else
          target^:=AnsiChar(code);
        inc(source);
        inc(target);
        dec(remaining);
      end;
  end;
  78. {$endif FPC_HAS_DEFAULT_UNICODE_2_ANSI_MOVE}
  79. {$ifndef FPC_HAS_DEFAULT_ANSI_2_UNICODE}
  80. {$define FPC_HAS_DEFAULT_ANSI_2_UNICODE}
  procedure DefaultAnsi2UnicodeMove(source:pansichar;cp : TSystemCodePage;var dest:unicodestring;len:SizeInt);
  {
    Fallback AnsiChar -> UnicodeChar conversion.
    Resizes dest to len characters and widens every source byte to the
    UnicodeChar with the same code. The cp argument is not consulted.
  }
  var
    idx : SizeInt;
    target : PUnicodeChar;
  begin
    setlength(dest,len);
    { SetLength made dest unique, so it can be written through a raw pointer }
    target:=pointer(dest);
    idx:=0;
    while idx<len do
      begin
        target[idx]:=unicodechar(byte(source[idx]));
        inc(idx);
      end;
  end;
  95. {$endif FPC_HAS_DEFAULT_ANSI_2_UNICODE}
  96. {$ifndef FPC_HAS_BUILTIN_WIDESTR_MANAGER}
  function DefaultCharLengthPChar(const Str: PAnsiChar): PtrInt;
  { Default character count of a zero-terminated string: simply its length. }
  begin
    Result:=length(Str);
  end;
  function DefaultCodePointLength(const Str: PAnsiChar; MaxLookAead: PtrInt): Ptrint;
  {
    Default code point length: 1 when Str points at a non-zero character,
    0 when it points at the terminator. MaxLookAead is not used.
  }
  begin
    Result:=ord(Str^<>#0);
  end;
  108. {$endif FPC_HAS_BUILTIN_WIDESTR_MANAGER}
  function DefaultGetStandardCodePage(const stdcp: TStandardCodePageEnum): TSystemCodePage;
  {
    Returns DefaultFileSystemCodePage for scpFileSystemSingleByte and
    DefaultSystemCodePage for every other request.
  }
  begin
    { don't raise an exception here. We need this for text file handling }
    if stdcp=scpFileSystemSingleByte then
      { we could return UTF-8 here in case of FPCRTL_FILESYSTEM_UTF8, but
        without a fully functional widestring manager that will probably cause
        more problems than it solves }
      Result:=DefaultFileSystemCodePage
    else
      Result:=DefaultSystemCodePage;
  end;
  Procedure GetUnicodeStringManager (Out Manager : TUnicodeStringManager);
  { Copies the currently installed string manager record into Manager. }
  begin
    Manager:=WideStringManager;
  end;
  Procedure SetUnicodeStringManager (Const New : TUnicodeStringManager; Out Old: TUnicodeStringManager);
  { Installs New as the string manager and hands the previous one back in Old. }
  begin
    { save the current manager first, then replace it }
    GetUnicodeStringManager(Old);
    WideStringManager:=New;
  end;
  Procedure SetUnicodeStringManager (Const New : TUnicodeStringManager);
  { Installs New as the string manager; the previous one is discarded. }
  begin
    WideStringManager:=New;
  end;
  Procedure GetWideStringManager (out Manager : TUnicodeStringManager);
  { Same as GetUnicodeStringManager: returns the installed string manager. }
  begin
    GetUnicodeStringManager(Manager);
  end;
  Procedure SetWideStringManager (Const New : TUnicodeStringManager; Out old: TUnicodeStringManager);
  { Same as the two-argument SetUnicodeStringManager: installs New, returns the previous manager in old. }
  begin
    SetUnicodeStringManager(New,old);
  end;
  Procedure SetWideStringManager (Const New : TUnicodeStringManager);
  { Same as the one-argument SetUnicodeStringManager: installs New. }
  begin
    SetUnicodeStringManager(New);
  end;
  146. {****************************************************************************
  147. Internal functions, not in interface.
  148. ****************************************************************************}
  149. {$ifndef FPC_HAS_UNICODESTR_DECR_REF}
  150. {$define FPC_HAS_UNICODESTR_DECR_REF}
  Procedure fpc_UnicodeStr_Decr_Ref (Var S : Pointer);[Public,Alias:'FPC_UNICODESTR_DECR_REF']; compilerproc;
  {
    Drops one reference to the unicodestring S points at and sets S to nil.
    The string memory is released when the last reference goes away.
    Strings with a non-positive reference count (constants) are left alone.
  }
  Var
    data : pointer;
    header : PUnicodeRec;
    release : boolean;
  Begin
    data:=S;
    if data=nil then
      exit;
    S:=nil;
    header:=PUnicodeRec(data-UnicodeFirstOff);
    if header^.ref=1 then
      { sole owner: no need for the locked decrement }
      release:=true
    else if header^.ref>0 then
      { shared: decrement atomically, release only if that reached zero }
      release:=declocked(header^.ref)
    else
      { ref = -1 is a constant string }
      release:=false;
    if release then
      FreeMem(pointer(header));
  end;

  { alias for internal use }
  Procedure fpc_UnicodeStr_Decr_Ref (Var S : Pointer);[external name 'FPC_UNICODESTR_DECR_REF'];
  170. {$endif FPC_HAS_UNICODESTR_DECR_REF}
  171. {$ifndef FPC_HAS_UNICODESTR_INCR_REF}
  172. {$define FPC_HAS_UNICODESTR_INCR_REF}
  Procedure fpc_UnicodeStr_Incr_Ref(S : Pointer);[Public,Alias:'FPC_UNICODESTR_INCR_REF']; compilerproc;
  {
    Adds one reference to the unicodestring S points at.
    Nil strings and constant strings (negative reference count) are ignored.
  }
  Begin
    if (S<>nil) and (PUnicodeRec(S-UnicodeFirstOff)^.Ref>=0) then
      inclocked(PUnicodeRec(S-UnicodeFirstOff)^.Ref);
  end;

  { alias for internal use }
  Procedure fpc_UnicodeStr_Incr_Ref (S : Pointer);[external name 'FPC_UNICODESTR_INCR_REF'];
  184. {$endif FPC_HAS_UNICODESTR_INCR_REF}
  185. {$ifndef FPC_HAS_UNICODESTR_TO_SHORTSTR}
  186. {$define FPC_HAS_UNICODESTR_TO_SHORTSTR}
  procedure fpc_UnicodeStr_To_ShortStr (out res: ShortString;const S2 : UnicodeString); [Public, alias: 'FPC_UNICODESTR_TO_SHORTSTR'];compilerproc;
  {
    Converts a UnicodeString to a ShortString using DefaultSystemCodePage.
    At most high(res) source characters are handed to the converter.
  }
  Var
    CharCount : SizeInt;
    converted : ansistring;
  begin
    res:='';
    CharCount:=Length(S2);
    if CharCount<=0 then
      exit;
    { never convert more characters than the destination can hold }
    if CharCount>high(res) then
      CharCount:=high(res);
    widestringmanager.Unicode2AnsiMoveProc(PUnicodeChar(Pointer(S2)),converted,DefaultSystemCodePage,CharCount);
    res:=converted;
  end;
  205. {$endif FPC_HAS_UNICODESTR_TO_SHORTSTR}
  206. {$ifndef FPC_HAS_SHORTSTR_TO_UNICODESTR}
  207. {$define FPC_HAS_SHORTSTR_TO_UNICODESTR}
  Function fpc_ShortStr_To_UnicodeStr (Const S2 : ShortString): UnicodeString;compilerproc;
  {
    Converts a ShortString to a UnicodeString using DefaultSystemCodePage.
    An empty source yields an empty result.
  }
  begin
    result:='';
    if Length(S2)<=0 then
      exit;
    widestringmanager.Ansi2UnicodeMoveProc(PAnsiChar(@S2[1]),DefaultSystemCodePage,result,Length(S2));
  end;
  220. {$endif FPC_HAS_SHORTSTR_TO_UNICODESTR}
  221. {$ifndef FPC_HAS_UNICODESTR_TO_ANSISTR}
  222. {$define FPC_HAS_UNICODESTR_TO_ANSISTR}
  Function fpc_UnicodeStr_To_AnsiStr (const S2 : UnicodeString;cp : TSystemCodePage): AnsiString; compilerproc;
  {
    Converts a UnicodeString to an AnsiString in code page cp
    (passed through TranslatePlaceholderCP first).
  }
  begin
    result:='';
    if Length(S2)<=0 then
      exit;
    widestringmanager.Unicode2AnsiMoveProc(PUnicodeChar(Pointer(S2)),result,TranslatePlaceholderCP(cp),Length(S2));
  end;
  235. {$endif FPC_HAS_UNICODESTR_TO_ANSISTR}
  236. {$ifndef FPC_HAS_ANSISTR_TO_UNICODESTR}
  237. {$define FPC_HAS_ANSISTR_TO_UNICODESTR}
  Function fpc_AnsiStr_To_UnicodeStr (Const S2 : RawByteString): UnicodeString; compilerproc;
  {
    Converts an AnsiString to a UnicodeString, interpreting the bytes in the
    string's own code page (passed through TranslatePlaceholderCP first).
  }
  Var
    SourceCP : TSystemCodePage;
  begin
    result:='';
    if Length(S2)<=0 then
      exit;
    SourceCP:=TranslatePlaceholderCP(StringCodePage(S2));
    widestringmanager.Ansi2UnicodeMoveProc(PAnsiChar(S2),SourceCP,result,Length(S2));
  end;
  254. {$endif FPC_HAS_ANSISTR_TO_UNICODESTR}
  255. {$ifndef FPC_HAS_UNICODESTR_TO_WIDESTR}
  256. {$define FPC_HAS_UNICODESTR_TO_WIDESTR}
  Function fpc_UnicodeStr_To_WideStr (const S2 : UnicodeString): WideString; compilerproc;
  { Copies the characters of a UnicodeString into a new WideString of the same length. }
  var
    CharCount : SizeInt;
  begin
    CharCount:=Length(S2);
    SetLength(Result,CharCount);
    Move(pointer(S2)^,Pointer(Result)^,CharCount*sizeof(WideChar));
  end;
  262. {$endif FPC_HAS_UNICODESTR_TO_WIDESTR}
  263. {$ifndef FPC_HAS_WIDESTR_TO_UNICODESTR}
  264. {$define FPC_HAS_WIDESTR_TO_UNICODESTR}
  Function fpc_WideStr_To_UnicodeStr (Const S2 : WideString): UnicodeString; compilerproc;
  { Copies the characters of a WideString into a new UnicodeString of the same length. }
  var
    CharCount : SizeInt;
  begin
    CharCount:=Length(S2);
    SetLength(Result,CharCount);
    Move(pointer(S2)^,Pointer(Result)^,CharCount*sizeof(WideChar));
  end;
  270. {$endif FPC_HAS_WIDESTR_TO_UNICODESTR}
  271. {$ifndef FPC_HAS_PWIDECHAR_TO_UNICODESTR}
  272. {$define FPC_HAS_PWIDECHAR_TO_UNICODESTR}
  Function fpc_PWideChar_To_UnicodeStr(const p : pwidechar): unicodestring; compilerproc;
  {
    Builds a UnicodeString from a zero-terminated wide character buffer.
    A nil pointer gives an empty string.
  }
  var
    CharCount : SizeInt;
  begin
    result:='';
    if Assigned(p) then
      begin
        { position of the terminating zero = number of characters }
        CharCount:=IndexWord(p^, -1, 0);
        Setlength(result,CharCount);
        if CharCount>0 then
          Move(p^,Pointer(result)^,CharCount*sizeof(UnicodeChar));
      end;
  end;
  285. {$endif FPC_HAS_PWIDECHAR_TO_UNICODESTR}
  286. {$ifndef FPC_HAS_PWIDECHAR_TO_ANSISTR}
  287. {$define FPC_HAS_PWIDECHAR_TO_ANSISTR}
  Function fpc_PWideChar_To_AnsiStr(const p : pwidechar;cp : TSystemCodePage): ansistring; compilerproc;
  {
    Converts a zero-terminated wide character buffer to an AnsiString in code
    page cp (passed through TranslatePlaceholderCP first). Nil gives ''.
  }
  var
    CharCount : SizeInt;
  begin
    result:='';
    if Assigned(p) then
      begin
        CharCount:=IndexWord(p^, -1, 0);
        if CharCount>0 then
          widestringmanager.Wide2AnsiMoveProc(p,result,TranslatePlaceholderCP(cp),CharCount);
      end;
  end;
  299. {$endif FPC_HAS_PWIDECHAR_TO_ANSISTR}
  300. {$ifndef FPC_HAS_PWIDECHAR_TO_SHORTSTR}
  301. {$define FPC_HAS_PWIDECHAR_TO_SHORTSTR}
  procedure fpc_PWideChar_To_ShortStr(out res : shortstring;const p : pwidechar); compilerproc;
  {
    Converts a zero-terminated wide character buffer to a ShortString using
    DefaultSystemCodePage. Nil or an empty buffer gives ''.
  }
  var
    CharCount : SizeInt;
    converted : ansistring;
  begin
    res:='';
    if not Assigned(p) then
      exit;
    CharCount:=IndexWord(p^, high(PtrInt), 0);
    if CharCount<=0 then
      exit;
    widestringmanager.Wide2AnsiMoveProc(p,converted,DefaultSystemCodePage,CharCount);
    res:=converted;
  end;
  317. {$endif FPC_HAS_PWIDECHAR_TO_SHORTSTR}
  {$ifndef FPC_HAS_UNICODESTR_ASSIGN}
  { Define the same symbol the guard above tests, like every other routine in this file. }
  {$define FPC_HAS_UNICODESTR_ASSIGN}
  { Older spelling of the symbol, still defined for anything that tests it. }
  {$define FPC_UNICODESTR_ASSIGN}
  { checked against the ansistring routine, 2001-05-27 (FK) }
  Procedure fpc_UnicodeStr_Assign (Var S1 : Pointer;S2 : Pointer);[Public,Alias:'FPC_UNICODESTR_ASSIGN']; compilerproc;
  {
    Assigns S2 to S1 (S1:=S2), taking in account reference counts.
    S1 : variable receiving the string; its previous value loses one reference.
    S2 : string being assigned; gains one reference unless it is nil or its
         reference count is not positive (constant string).
  }
  begin
    { Take the new reference first, so that S1:=S1 cannot free the string. }
    If S2<>nil then
      If PUnicodeRec(S2-UnicodeFirstOff)^.Ref>0 then
        inclocked(PUnicodeRec(S2-UnicodeFirstOff)^.ref);
    { Decrease the reference count on the old S1 }
    fpc_unicodestr_decr_ref (S1);
    s1:=s2;
  end;

  { alias for internal use }
  Procedure fpc_UnicodeStr_Assign (Var S1 : Pointer;S2 : Pointer);[external name 'FPC_UNICODESTR_ASSIGN'];
  {$endif FPC_HAS_UNICODESTR_ASSIGN}
  336. {$ifndef FPC_HAS_UNICODESTR_CONCAT}
  337. {$define FPC_HAS_UNICODESTR_CONCAT}
  procedure fpc_UnicodeStr_Concat (var DestS:Unicodestring;const S1,S2 : UnicodeString); compilerproc;
  {
    DestS:=S1+S2.
    If either operand is empty the other one is assigned directly. Otherwise the
    result is built either by growing DestS in place (when DestS is the sole
    owner of its memory) or in a freshly allocated string.
  }
  Var
    LeftLen,RightLen,TotalLen,AllocSize : SizeInt;
    PrevData,NewData,Block,RightSrc : Pointer;
  begin
    { only assign if s1 or s2 is empty }
    if Length(S1)=0 then
      begin
        DestS:=S2;
        exit;
      end;
    if Length(S2)=0 then
      begin
        DestS:=S1;
        exit;
      end;
    LeftLen:=PUnicodeRec(Pointer(S1)-UnicodeFirstOff)^.Len;
    RightLen:=PUnicodeRec(Pointer(S2)-UnicodeFirstOff)^.Len;
    TotalLen:=LeftLen+RightLen;
    { header + characters + terminating #0 }
    AllocSize:=UnicodeFirstOff+sizeof(UnicodeChar)+TotalLen*sizeof(UnicodeChar);
    PrevData:=Pointer(DestS);
    if (PrevData<>nil) and (PUnicodeRec(PrevData-UnicodeFirstOff)^.Ref=1) then
      begin
        { Sole owner: reallocate in place, hoping the chunk can be reused without a copy. }
        Block:=PrevData-UnicodeFirstOff;
        NewData:=ReallocMem(Block,AllocSize)+UnicodeFirstOff;
        { S2 goes first: when S2 is the old DestS its characters now live at the
          start of the new block and must be moved before S1 overwrites them. }
        if Pointer(S2)=PrevData then
          RightSrc:=NewData
        else
          RightSrc:=Pointer(S2);
        Move(RightSrc^,PUnicodeChar(NewData)[LeftLen],RightLen*sizeof(UnicodeChar));
        { When S1 is the old DestS this is an append and S1 is already in place. }
        if Pointer(S1)<>PrevData then
          Move(Pointer(S1)^,NewData^,LeftLen*sizeof(UnicodeChar));
      end
    else
      begin
        { DestS is nil, shared or constant: build the result in a new block. }
        Block:=GetMem(AllocSize);
        NewData:=Block+UnicodeFirstOff;
        PUnicodeRec(Block)^.CodePage:=DefaultUnicodeCodePage;
        PUnicodeRec(Block)^.ElementSize:=sizeof(UnicodeChar);
        PUnicodeRec(Block)^.Ref:=1;
        Move(Pointer(S1)^,NewData^,LeftLen*sizeof(UnicodeChar));
        Move(Pointer(S2)^,PUnicodeChar(NewData)[LeftLen],RightLen*sizeof(UnicodeChar));
        { drop the old DestS only after both operands have been copied }
        fpc_unicodestr_decr_ref(Pointer(DestS));
      end;
    PUnicodeChar(NewData)[TotalLen]:=#0;
    PUnicodeRec(NewData-UnicodeFirstOff)^.Len:=TotalLen;
    Pointer(DestS):=NewData;
  end;
  384. {$endif FPC_HAS_UNICODESTR_CONCAT}
  385. {$ifndef FPC_HAS_UNICODESTR_CONCAT_MULTI}
  386. {$define FPC_HAS_UNICODESTR_CONCAT_MULTI}
  procedure fpc_UnicodeStr_Concat_multi (var DestS:Unicodestring;const sarr:array of Unicodestring); compilerproc;
  {
    DestS:=sarr[0]+sarr[1]+...+sarr[high(sarr)].
    All-empty input gives ''; a single non-empty piece is assigned directly.
    Otherwise the result is built either by growing DestS in place (when DestS
    is the sole owner of its memory) or in a freshly allocated string.
  }
  Var
    first,idx,chunk,total : SizeInt;
    src,cursor,prevdata,newdata,block : pointer;
  begin
    first:=low(sarr);
    { skip empty strings }
    while (first<=high(sarr)) and (sarr[first]='') do
      inc(first);
    if first>high(sarr) then
      begin
        DestS:=''; { All source strings empty }
        exit;
      end;
    { Total length of the result, so that one allocation is enough. }
    total:=0;
    for idx:=first to high(sarr) do
      inc(total,length(sarr[idx]));
    { Only one piece is non-empty: return it directly. }
    if total=PUnicodeRec(Pointer(sarr[first])-UnicodeFirstOff)^.Len then
      begin
        DestS:=sarr[first];
        exit;
      end;
    prevdata:=Pointer(DestS);
    if (prevdata<>nil) and (PUnicodeRec(prevdata-UnicodeFirstOff)^.Ref=1) then
      begin
        { Sole owner: reallocate in place, hoping the chunk can be reused without a copy. }
        block:=prevdata-UnicodeFirstOff;
        newdata:=ReallocMem(block,UnicodeFirstOff+sizeof(UnicodeChar)+total*sizeof(UnicodeChar))+UnicodeFirstOff;
        { Appending to DestS: the first piece is already in place. }
        if Pointer(sarr[first])=prevdata then
          inc(first);
      end
    else
      begin
        { New string. prevdata=nil marks this case for the code below and keeps
          the "piece is the old DestS" test in the copy loop from ever matching. }
        prevdata:=nil;
        block:=GetMem(total*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar)));
        newdata:=block+UnicodeFirstOff;
        PUnicodeRec(block)^.CodePage:=DefaultUnicodeCodePage;
        PUnicodeRec(block)^.ElementSize:=sizeof(UnicodeChar);
        PUnicodeRec(block)^.Ref:=1;
      end;
    { Fill from the last piece to the first, so that occurrences of the old
      DestS can still be read from the start of the reallocated block. }
    cursor:=newdata+total*sizeof(UnicodeChar);
    PUnicodeChar(cursor)^:=#0; { terminator sits right after the last character }
    for idx:=high(sarr) downto first do
      begin
        src:=Pointer(sarr[idx]);
        if Assigned(src) then
          begin
            { The old DestS was moved by ReallocMem: read it through the new
              pointer, whose header still carries the old length. }
            if src=prevdata then
              src:=newdata;
            chunk:=PUnicodeRec(src-UnicodeFirstOff)^.Len*sizeof(UnicodeChar);
            dec(cursor,chunk);
            Move(src^,cursor^,chunk);
          end;
      end;
    { Only now: the loop above relied on the old Len in the header. }
    PUnicodeRec(newdata-UnicodeFirstOff)^.Len:=total;
    { In the new-string case the previous DestS still has to be released. }
    if prevdata=nil then
      fpc_UnicodeStr_Decr_Ref(Pointer(DestS));
    Pointer(DestS):=newdata;
  end;
  451. {$endif FPC_HAS_UNICODESTR_CONCAT_MULTI}
  452. {$ifndef FPC_HAS_CHAR_TO_UCHAR}
  453. {$define FPC_HAS_CHAR_TO_UCHAR}
  Function fpc_Char_To_UChar(const c : AnsiChar): UnicodeChar; compilerproc;
  {
    Converts an AnsiChar (interpreted in DefaultSystemCodePage) to a UnicodeChar.
    Returns the first character the installed string manager produces. If the
    manager produces nothing, '?' is returned instead of indexing an empty
    string, matching the fallback used by fpc_UChar_To_Char.
  }
  var
    w: unicodestring;
  begin
    widestringmanager.Ansi2UnicodeMoveProc(@c,DefaultSystemCodePage,w,1);
    if length(w)>0 then
      fpc_Char_To_UChar:=w[1]
    else
      fpc_Char_To_UChar:='?';
  end;
  461. {$endif FPC_HAS_CHAR_TO_UCHAR}
  462. {$ifndef FPC_HAS_CHAR_TO_UNICODESTR}
  463. {$define FPC_HAS_CHAR_TO_UNICODESTR}
  Function fpc_Char_To_UnicodeStr(const c : AnsiChar): UnicodeString; compilerproc;
  { Converts a single AnsiChar (interpreted in DefaultSystemCodePage) to a UnicodeString. }
  var
    src : PAnsiChar;
  begin
    src:=@c;
    widestringmanager.Ansi2UnicodeMoveProc(src,DefaultSystemCodePage,Result,1);
  end;
  471. {$endif FPC_HAS_CHAR_TO_UNICODESTR}
  472. {$ifndef FPC_HAS_UCHAR_TO_CHAR}
  473. {$define FPC_HAS_UCHAR_TO_CHAR}
  Function fpc_UChar_To_Char(const c : UnicodeChar): AnsiChar; compilerproc;
  {
    Converts a UnicodeChar to an AnsiChar in DefaultSystemCodePage.
    Returns '?' unless the conversion yields exactly one character.
  }
  var
    converted: ansistring;
  begin
    widestringmanager.Unicode2AnsiMoveProc(@c, converted, DefaultSystemCodePage, 1);
    if length(converted)<>1 then
      Result:='?'
    else
      Result:=converted[1];
  end;
  487. {$endif FPC_HAS_UCHAR_TO_CHAR}
  488. {$ifndef FPC_HAS_UCHAR_TO_SHORTSTR}
  489. {$define FPC_HAS_UCHAR_TO_SHORTSTR}
  function fpc_UChar_To_ShortStr(const c : WideChar): shortstring; compilerproc;
  { Converts a single WideChar to a ShortString using DefaultSystemCodePage. }
  var
    converted: ansistring;
  begin
    widestringmanager.Wide2AnsiMoveProc(@c,converted,DefaultSystemCodePage,1);
    Result:=converted;
  end;
  500. {$endif FPC_HAS_UCHAR_TO_SHORTSTR}
  501. {$ifndef FPC_HAS_UCHAR_TO_UNICODESTR}
  502. {$define FPC_HAS_UCHAR_TO_UNICODESTR}
  Function fpc_UChar_To_UnicodeStr(const c : UnicodeChar): UnicodeString; compilerproc;
  { Returns a UnicodeString of length 1 holding c. }
  begin
    Setlength(Result,1);
    Result[1]:=c;
  end;
  511. {$endif FPC_HAS_UCHAR_TO_UNICODESTR}
  512. {$ifndef FPC_HAS_UCHAR_TO_ANSISTR}
  513. {$define FPC_HAS_UCHAR_TO_ANSISTR}
  Function fpc_UChar_To_AnsiStr(const c : UnicodeChar;cp : TSystemCodePage): AnsiString; compilerproc;
  {
    Converts a single UnicodeChar to an AnsiString in code page cp
    (passed through TranslatePlaceholderCP first).
  }
  begin
    widestringmanager.Unicode2AnsiMoveProc(@c, Result, TranslatePlaceholderCP(cp), 1);
  end;
  521. {$endif FPC_HAS_UCHAR_TO_ANSISTR}
  522. {$ifndef FPC_HAS_PCHAR_TO_UNICODESTR}
  523. {$define FPC_HAS_PCHAR_TO_UNICODESTR}
  Function fpc_PChar_To_UnicodeStr(const p : PAnsiChar): UnicodeString; compilerproc;
  {
    Converts a zero-terminated AnsiChar buffer (interpreted in
    DefaultSystemCodePage) to a UnicodeString. Nil or an empty buffer gives ''.
  }
  Var
    ByteCount : SizeInt;
  begin
    if assigned(p) and (p^<>#0) then
      begin
        { position of the terminating zero = number of bytes to convert }
        ByteCount:=IndexChar(p^,-1,#0);
        widestringmanager.Ansi2UnicodeMoveProc(p,DefaultSystemCodePage,Result,ByteCount);
      end
    else
      Result:='';
  end;
  536. {$endif FPC_HAS_PCHAR_TO_UNICODESTR}
  537. {$ifndef FPC_HAS_CHARARRAY_TO_UNICODESTR}
  538. {$define FPC_HAS_CHARARRAY_TO_UNICODESTR}
  Function fpc_CharArray_To_UnicodeStr(const arr: array of ansichar; zerobased: boolean = true): UnicodeString; compilerproc;
  {
    Converts an array of AnsiChar (interpreted in DefaultSystemCodePage) to a
    UnicodeString.
    zerobased = true : the array is treated as zero-terminated; conversion stops
                       at the first #0, or uses the whole array if there is none.
    zerobased = false: the whole array is converted.
    An array without elements gives '' in the zero-based case; arr[0] is only
    inspected after checking that it exists.
  }
  var
    i : SizeInt;
  begin
    if zerobased then
      begin
        if (high(arr)<0) or (arr[0]=#0) Then
          begin
            fpc_chararray_to_unicodestr:='';
            exit;
          end;
        i:=IndexChar(arr,high(arr)+1,#0);
        { no terminator found: take every element }
        if i=-1 then
          i:=high(arr)+1;
      end
    else
      i:=high(arr)+1;
    widestringmanager.Ansi2UnicodeMoveProc(pansichar(@arr),DefaultSystemCodePage,fpc_CharArray_To_UnicodeStr,i);
  end;
  558. {$endif FPC_HAS_CHARARRAY_TO_UNICODESTR}
  559. {$ifndef FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
  560. {$define FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
  Function fpc_WideCharArray_To_UnicodeStr(const arr: array of widechar; zerobased: boolean = true): UnicodeString; compilerproc;
  {
    Copies an array of WideChar into a UnicodeString. With zerobased = true the
    copy stops at the first zero element; otherwise, or when there is no zero
    element, the whole array is taken.
  }
  var
    count,zeropos : SizeInt;
  begin
    count:=high(arr)+1;
    if zerobased then
      begin
        zeropos:=IndexWord(arr,count,0);
        if zeropos<>-1 then
          count:=zeropos;
      end;
    SetLength(Result,count);
    Move(arr[0], Pointer(Result)^,count*sizeof(WideChar));
  end;
  576. {$endif FPC_HAS_WIDECHARARRAY_TO_UNICODESTR}
  577. {$ifndef FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
  578. {$define FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
  579. { due to their names, the following procedures should be in wstrings.inc,
  580. however, the compiler generates code using this functions on all platforms }
  procedure fpc_WideCharArray_To_ShortStr(out res : shortstring;const arr: array of widechar; zerobased: boolean = true);[public,alias:'FPC_WIDECHARARRAY_TO_SHORTSTR']; compilerproc;
  {
    Converts an array of WideChar to a ShortString using DefaultSystemCodePage.
    At most high(res) elements are considered. With zerobased = true the
    conversion stops at the first zero element inside that range.
  }
  var
    limit: longint;
    zeropos: ptrint;
    count: byte;
    converted: ansistring;
  begin
    { clamp the number of elements to 0..high(res) }
    limit := high(arr)+1;
    if limit<0 then
      limit:=0
    else if limit>high(res) then
      limit:=high(res);
    count:=limit;
    if zerobased then
      begin
        zeropos:=IndexWord(arr[0],limit,0);
        if zeropos>=0 then
          count:=zeropos;
      end;
    widestringmanager.Wide2AnsiMoveProc (pwidechar(@arr),converted,DefaultSystemCodePage,count);
    res:=converted;
  end;
  606. {$endif FPC_HAS_WIDECHARARRAY_TO_SHORTSTR}
  607. {$ifndef FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
  608. {$define FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
  Function fpc_WideCharArray_To_AnsiStr(const arr: array of widechar; cp : TSystemCodePage; zerobased: boolean = true): AnsiString; compilerproc;
  {
    Converts an array of WideChar to an AnsiString in code page cp (passed
    through TranslatePlaceholderCP first). With zerobased = true the conversion
    stops at the first zero element; otherwise, or when there is no zero
    element, the whole array is taken.
  }
  var
    count,zeropos : SizeInt;
  begin
    count:=high(arr)+1;
    if zerobased then
      begin
        zeropos:=IndexWord(arr,count,0);
        if zeropos<>-1 then
          count:=zeropos;
      end;
    if count<=0 then
      Result:=''
    else
      widestringmanager.Wide2AnsiMoveProc (pwidechar(@arr),RawByteString(Result),TranslatePlaceholderCP(cp),count);
  end;
  626. {$endif FPC_HAS_WIDECHARARRAY_TO_ANSISTR}
  627. {$ifndef FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
  628. {$define FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
  Function fpc_WideCharArray_To_WideStr(const arr: array of widechar; zerobased: boolean = true): WideString; compilerproc;
  {
    Copies an open array of WideChar into a freshly sized WideString.
    With zerobased=true the copy stops in front of the first #0 element
    (when there is one); otherwise every element of arr is copied.
  }
  var
    CharCount,NulIndex : SizeInt;
  begin
    CharCount:=high(arr)+1;
    if zerobased then
      begin
        NulIndex:=IndexWord(arr,high(arr)+1,0);
        if NulIndex<>-1 then
          CharCount:=NulIndex;
      end;
    SetLength(Result,CharCount);
    Move(arr[0],Pointer(Result)^,CharCount*sizeof(WideChar));
  end;
  644. {$endif FPC_HAS_WIDECHARARRAY_TO_WIDESTR}
  645. {$ifndef FPC_HAS_UNICODESTR_TO_CHARARRAY}
  646. {$define FPC_HAS_UNICODESTR_TO_CHARARRAY}
  procedure fpc_unicodestr_to_chararray(out res: array of AnsiChar; const src: UnicodeString); compilerproc;
  {
    Converts src to DefaultSystemCodePage via the widestring manager and
    stores the bytes in res. Output that does not fit is cut off, unused
    trailing elements of res are set to #0.
  }
  var
    count: SizeInt;
    converted: ansistring;
  begin
    { only hand non-empty input to the manager so that a nil src is never
      dereferenced }
    if length(src)>0 then
      widestringmanager.unicode2ansimoveproc(punicodechar(pointer(src)),converted,DefaultSystemCodePage,length(src));
    { copy as much as fits ... }
    count:=length(converted);
    if count>length(res) then
      count:=length(res);
  {$push}
  {$r-}
    move(converted[1],res[0],count);
    { ... and clear the remainder of the target }
    fillchar(res[count],length(res)-count,0);
  {$pop}
  end;
  {$endif FPC_HAS_UNICODESTR_TO_CHARARRAY}
  666. {$ifndef FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
  667. {$define FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
  procedure fpc_ansistr_to_widechararray(out res: array of widechar; const src: RawByteString); compilerproc;
  {
    Converts src (interpreted in its own code page, after
    TranslatePlaceholderCP) to wide characters and stores them in res.
    Output that does not fit is cut off, unused trailing elements of res
    are set to #0.
  }
  var
    count: SizeInt;
    converted: widestring;
  begin
    { only hand non-empty input to the manager so that a nil src is never
      dereferenced }
    if length(src)>0 then
      widestringmanager.ansi2widemoveproc(pansichar(@src[1]),TranslatePlaceholderCP(StringCodePage(src)),converted,length(src));
    count:=length(converted);
    if count>length(res) then
      count:=length(res);
  {$push}
  {$r-}
    move(converted[1],res[0],count*sizeof(widechar));
    fillchar(res[count],(length(res)-count)*SizeOf(WideChar),0);
  {$pop}
  end;
  686. {$endif FPC_HAS_ANSISTR_TO_WIDECHARARRAY}
  687. {$ifndef FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
  688. {$define FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
  procedure fpc_shortstr_to_widechararray(out res: array of widechar; const src: ShortString); compilerproc;
  {
    Converts src from DefaultSystemCodePage to wide characters and stores
    them in res. Output that does not fit is cut off, unused trailing
    elements of res are set to #0.
  }
  var
    count: longint;
    converted : widestring;
  begin
    { never touch character 1 of an empty shortstring }
    if length(src)>0 then
      widestringmanager.ansi2widemoveproc(pansichar(@src[1]),DefaultSystemCodePage,converted,length(src));
    count:=length(converted);
    if count>length(res) then
      count:=length(res);
  {$push}
  {$r-}
    move(converted[1],res[0],count*sizeof(widechar));
    fillchar(res[count],(length(res)-count)*SizeOf(WideChar),0);
  {$pop}
  end;
  707. {$endif FPC_HAS_SHORTSTR_TO_WIDECHARARRAY}
  708. {$ifndef FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
  709. {$define FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
  procedure fpc_unicodestr_to_widechararray(out res: array of widechar; const src: UnicodeString); compilerproc;
  {
    Copies the characters of src into res. Characters that do not fit are
    dropped, unused trailing elements of res are set to #0.
  }
  var
    count: SizeInt;
  begin
    { number of characters to copy: the smaller of both lengths }
    count:=length(res);
    if length(src)<count then
      count:=length(src);
  {$push}
  {$r-}
    { src[1] must not be touched when there is nothing to copy (src may be nil) }
    if count>0 then
      move(src[1],res[0],count*SizeOf(WideChar));
    fillchar(res[count],(length(res)-count)*SizeOf(WideChar),0);
  {$pop}
  end;
  725. {$endif FPC_HAS_UNICODESTR_TO_WIDECHARARRAY}
  726. {$ifndef FPC_HAS_UNICODESTR_COMPARE}
  727. {$define FPC_HAS_UNICODESTR_COMPARE}
  Function fpc_UnicodeStr_Compare(const S1,S2 : UnicodeString): SizeInt;[Public,Alias : 'FPC_UNICODESTR_COMPARE']; compilerproc;
  {
    Three-way comparison of two UnicodeStrings:
     <0  S1 sorts before S2
      0  both are equal
     >0  S1 sorts after S2
    The common prefix is compared word by word; if it is identical the
    difference of the lengths decides.
  }
  Var
    Len1,Len2,Common : SizeInt;
  begin
    { same string data (or both empty): nothing to compare }
    if pointer(S1)=pointer(S2) then
      exit(0);
    Len1:=Length(S1);
    Len2:=Length(S2);
    if Len1<Len2 then
      Common:=Len1
    else
      Common:=Len2;
    Result:=CompareWord(S1[1],S2[1],Common);
    if Result=0 then
      Result:=Len1-Len2;
  end;
  753. {$endif FPC_HAS_UNICODESTR_COMPARE}
  754. {$ifndef FPC_HAS_UNICODESTR_COMPARE_EQUAL}
  755. {$define FPC_HAS_UNICODESTR_COMPARE_EQUAL}
  Function fpc_UnicodeStr_Compare_Equal(const S1,S2 : UnicodeString): SizeInt;[Public,Alias : 'FPC_UNICODESTR_COMPARE_EQUAL']; compilerproc;
  {
    Equality-only comparison of two UnicodeStrings:
       0  S1 equals S2
     <>0  S1 differs from S2
    Strings of different length are reported as different (-1) without
    looking at their contents.
  }
  Var
    Len : SizeInt;
  begin
    if pointer(S1)=pointer(S2) then
      Result:=0
    else
      begin
        Len:=Length(S1);
        if Len=Length(S2) then
          Result:=CompareWord(S1[1],S2[1],Len)
        else
          Result:=-1;
      end;
  end;
  774. {$endif FPC_HAS_UNICODESTR_COMPARE_EQUAL}
  775. {$ifndef FPC_HAS_UNICODESTR_RANGECHECK}
  776. {$define FPC_HAS_UNICODESTR_RANGECHECK}
  Procedure fpc_UnicodeStr_RangeCheck(p: Pointer; index: SizeInt);[Public,Alias : 'FPC_UNICODESTR_RANGECHECK']; compilerproc;
  {
    Range check for 1-based indexing: reports error 201 unless p is a
    non-nil string and 1 <= index <= its stored length.
  }
  begin
    { the nil test has to come first, the last test reads the string header }
    if (p=nil) or (index<1) or (index>PUnicodeRec(p-UnicodeFirstOff)^.len) then
      HandleErrorAddrFrameInd(201,get_pc_addr,get_frame);
  end;
  Procedure fpc_UnicodeStr_ZeroBased_RangeCheck(p: Pointer; index: SizeInt);[Public,Alias : 'FPC_UNICODESTR_ZEROBASED_RANGECHECK']; compilerproc;
  {
    Range check for 0-based indexing: reports error 201 unless p is a
    non-nil string and 0 <= index < its stored length.
  }
  begin
    { the nil test has to come first, the last test reads the string header }
    if (p=nil) or (index<0) or (index>=PUnicodeRec(p-UnicodeFirstOff)^.len) then
      HandleErrorAddrFrameInd(201,get_pc_addr,get_frame);
  end;
  787. {$endif FPC_HAS_UNICODESTR_RANGECHECK}
  788. {$ifndef FPC_HAS_UNICODESTR_SETLENGTH}
  789. {$define FPC_HAS_UNICODESTR_SETLENGTH}
  Procedure fpc_UnicodeStr_SetLength(Var S : UnicodeString; l : SizeInt);[Public,Alias : 'FPC_UNICODESTR_SETLENGTH']; compilerproc;
  {
    Sets the length of string S to l characters.
    Makes sure S is unique and has enough room for l characters plus the
    terminating zero.

    l <= 0     : the reference held by S is released, nothing is allocated.
    Ref = 1    : the existing block is kept and only reallocated when it is
                 too small or much larger than needed.
    otherwise  : a new block is allocated, the old contents (at most l
                 characters) are copied and the old reference is released.
  }
  Var
    sp,oldsp,realsp : Pointer;
    lens, lena : SizeInt;
  begin
    if l<=0 then { length=0, deallocate the string }
      begin
        { NOTE(review): presumably decr_ref also sets S to nil - confirm in its implementation }
        fpc_unicodestr_decr_ref (Pointer(S));
        exit;
      end;
    sp:=Pointer(S);
    if (sp<>nil) and (PUnicodeRec(sp-UnicodeFirstOff)^.Ref=1) then
      begin
        { sole owner: resize in place }
        { lens = size of the current memory block, lena = size needed for
          header + l characters + terminator }
        lens:=MemSize(sp-UnicodeFirstOff);
        lena:=L*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar));
        { grow when too small; shrink only when the request (plus 16 bytes of
          slack) is at most half of the current block }
        if (lena>lens) or (lena+16<=SizeInt(SizeUint(lens) div 2)) then
          begin
            realsp:=sp-UnicodeFirstOff;
            sp:=reallocmem(realsp,lena)+UnicodeFirstOff;
          end;
      end
    else
      begin
        { Reallocation is needed... }
        { S is nil or its reference count is not 1: build a new block }
        oldsp:=sp;
        sp:=GetMem(l*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar)))+UnicodeFirstOff;
        PUnicodeRec(sp-UnicodeFirstOff)^.CodePage:=DefaultUnicodeCodePage;
        PUnicodeRec(sp-UnicodeFirstOff)^.ElementSize:=sizeof(UnicodeChar);
        PUnicodeRec(sp-UnicodeFirstOff)^.Ref:=1;
        if oldsp<>nil then
          begin
            { keep min(old length, l) characters of the previous contents }
            lens:=PUnicodeRec(oldsp-UnicodeFirstOff)^.Len;
            if l<lens then
              lens:=l;
            Move(oldsp^,sp^,lens * Sizeof(UnicodeChar));
            { give up this variable's reference to the old block }
            fpc_unicodestr_decr_ref(Pointer(S));
          end;
      end;
    { Null-terminate. }
    PWord(sp)[l]:=0;
    PUnicodeRec(sp-UnicodeFirstOff)^.Len:=l;
    Pointer(S):=sp;
  end;
  837. {$endif FPC_HAS_UNICODESTR_SETLENGTH}
  838. {*****************************************************************************
  839. Public functions, In interface.
  840. *****************************************************************************}
  function UnicodeCharToString(S : PUnicodeChar) : UnicodeString;
  { Converts a zero-terminated PUnicodeChar buffer to a UnicodeString. }
  var
    CharCount : SizeInt;
  begin
    { the length is taken from the string conversion of the buffer }
    CharCount:=Length(UnicodeString(s));
    Result:=UnicodeCharLenToString(s,CharCount);
  end;
  845. {$ifndef FPC_HAS_STRING_TO_UNICODECHAR}
  846. {$define FPC_HAS_STRING_TO_UNICODECHAR}
  function StringToUnicodeChar(const Src : RawByteString;Dest : PUnicodeChar;DestSize : SizeInt) : PUnicodeChar;
  { Same operation as StringToWideChar; simply forwards all arguments. }
  begin
    StringToUnicodeChar:=StringToWideChar(Src,Dest,DestSize);
  end;
  851. {$endif FPC_HAS_STRING_TO_UNICODECHAR}
  function WideCharToString(S : PWideChar) : UnicodeString;
  { Converts a zero-terminated PWideChar buffer to a UnicodeString. }
  var
    CharCount : SizeInt;
  begin
    { the length is taken from the string conversion of the buffer }
    CharCount:=Length(WideString(s));
    Result:=WideCharLenToString(s,CharCount);
  end;
  856. {$ifndef FPC_HAS_STRING_LEN_TO_WIDECHAR}
  857. {$define FPC_HAS_STRING_LEN_TO_WIDECHAR}
  function StringToWideChar(const Src : RawByteString;Dest : PWideChar;DestSize : SizeInt) : PWideChar;
  {
    Converts Src (interpreted in its own code page) to wide characters and
    stores them zero-terminated in Dest.

    Dest     : target buffer
    DestSize : capacity of Dest in wide characters, terminator included
    Result   : always Dest

    At most DestSize-1 characters are stored, followed by #0.
    When Dest is nil or DestSize <= 0 nothing is written at all: there is
    no room even for the terminator, and writing it would land in front of
    the buffer.
  }
  var
    temp: widestring;
    Len: SizeInt;
  begin
    result:=Dest;
    if (Dest=nil) or (DestSize<=0) then
      exit;
    widestringmanager.Ansi2WideMoveProc(PAnsiChar(Src),StringCodePage(Src),temp,Length(Src));
    Len:=Length(temp);
    { leave room for the terminator }
    if DestSize<=Len then
      Len:=Destsize-1;
    move(temp[1],Dest^,Len*SizeOf(WideChar));
    Dest[Len]:=#0;
  end;
  871. {$endif FPC_HAS_STRING_LEN_TO_WIDECHAR}
  872. {$ifndef FPC_HAS_UNICODEFROMLOCALECHARS}
  873. {$define FPC_HAS_UNICODEFROMLOCALECHARS}
  function UnicodeFromLocaleChars(CodePage, Flags: Cardinal; LocaleStr: PAnsiChar;
    LocaleStrLen: SizeInt; UnicodeStr: PWideChar; UnicodeStrLen: SizeInt): SizeInt; overload;
  {
    Converts LocaleStrLen bytes at LocaleStr from CodePage to wide characters.

    UnicodeStrLen <= 0 : nothing is stored, the result is the length of the
                         converted text.
    UnicodeStrLen > 0  : at most UnicodeStrLen-1 characters plus a
                         terminating #0 are stored in UnicodeStr, the result
                         is the number of characters stored (terminator not
                         counted).
    Flags is not used by this implementation.
  }
  var
    Converted: widestring;
  begin
    widestringmanager.Ansi2WideMoveProc(LocaleStr,CodePage,Converted,LocaleStrLen);
    Result:=Length(Converted);
    { Only move when we have room. }
    if UnicodeStrLen<=0 then
      exit;
    if Result>=UnicodeStrLen then
      Result:=UnicodeStrLen-1;
    move(Converted[1],UnicodeStr^,Result*SizeOf(WideChar));
    UnicodeStr[Result]:=#0;
  end;
  893. {$endif ndef FPC_HAS_UNICODEFROMLOCALECHARS}
  function UnicodeFromLocaleChars(const LocaleName: AnsiString; Flags: Cardinal;
    LocaleStr: PAnsiChar; LocaleStrLen: SizeInt; UnicodeStr: PWideChar;
    UnicodeStrLen: SizeInt): SizeInt; overload;
  {
    Variant taking a locale name instead of a code page number.
    Returns 0 when LocaleNameToCodePage cannot resolve LocaleName, otherwise
    the result of the code page based overload.
  }
  var
    CP : TSystemCodePage;
  begin
    Result:=0;
    if LocaleNameToCodePage(LocaleName,CP) then
      Result:=UnicodeFromLocaleChars(CP,Flags,LocaleStr,LocaleStrLen,UnicodeStr,UnicodeStrLen);
  end;
  905. {$ifndef FPC_HAS_UNICODECHAR_LEN_TO_STRING}
  906. {$define FPC_HAS_UNICODECHAR_LEN_TO_STRING}
  function UnicodeCharLenToString(S : PUnicodeChar;Len : SizeInt) : UnicodeString;
  { Returns a UnicodeString holding the first Len characters found at S. }
  begin
    SetLength(Result,Len);
    Move(S^,Pointer(Result)^,Len*SizeOf(UnicodeChar));
  end;
  912. {$endif FPC_HAS_UNICODECHAR_LEN_TO_STRING}
  procedure UnicodeCharLenToStrVar(Src : PUnicodeChar;Len : SizeInt;out Dest : UnicodeString);
  { Procedure form of UnicodeCharLenToString: stores the first Len
    characters at Src in Dest. }
  begin
    Dest:=UnicodeCharLenToString(Src,Len);
  end;
  procedure UnicodeCharLenToStrVar(Src : PUnicodeChar;Len : SizeInt;out Dest : AnsiString);
  { Stores the first Len characters at Src in Dest, converted to AnsiString. }
  var
    Wide : UnicodeString;
  begin
    Wide:=UnicodeCharLenToString(Src,Len);
    Dest:=AnsiString(Wide);
  end;
  procedure UnicodeCharToStrVar(S : PUnicodeChar;out Dest : AnsiString);
  { Stores the zero-terminated text at S in Dest, converted to AnsiString. }
  var
    Wide : UnicodeString;
  begin
    Wide:=UnicodeCharToString(S);
    Dest:=AnsiString(Wide);
  end;
  925. {$ifndef FPC_HAS_WIDECHAR_LEN_TO_STRING}
  926. {$define FPC_HAS_WIDECHAR_LEN_TO_STRING}
  function WideCharLenToString(S : PWideChar;Len : SizeInt) : UnicodeString;
  { Returns a UnicodeString holding the first Len characters found at S. }
  begin
    SetLength(Result,Len);
    Move(S^,Pointer(Result)^,Len*SizeOf(WideChar));
  end;
  932. {$endif FPC_HAS_WIDECHAR_LEN_TO_STRING}
  procedure WideCharLenToStrVar(Src : PWideChar;Len : SizeInt;out Dest : UnicodeString);
  { Procedure form of WideCharLenToString: stores the first Len characters
    at Src in Dest. }
  begin
    Dest:=WideCharLenToString(Src,Len);
  end;
  procedure WideCharLenToStrVar(Src : PWideChar;Len : SizeInt;out Dest : AnsiString);
  { Stores the first Len characters at Src in Dest, converted to AnsiString. }
  var
    Wide : UnicodeString;
  begin
    Wide:=WideCharLenToString(Src,Len);
    Dest:=AnsiString(Wide);
  end;
  procedure WideCharToStrVar(S : PWideChar;out Dest : UnicodeString);
  { Procedure form of WideCharToString: stores the zero-terminated text
    at S in Dest. }
  begin
    Dest:=WideCharToString(S);
  end;
  procedure WideCharToStrVar(S : PWideChar;out Dest : AnsiString);
  { Stores the zero-terminated text at S in Dest, converted to AnsiString. }
  var
    Wide : UnicodeString;
  begin
    Wide:=WideCharToString(S);
    Dest:=AnsiString(Wide);
  end;
  { Typed view of the routine exported under the name FPC_UNICODESTR_UNIQUE,
    so that it can be called with a UnicodeString variable. }
  Function fpc_unicodestr_Unique_func(Var S : UnicodeString): Pointer; external name 'FPC_UNICODESTR_UNIQUE';
  { Public entry point: calls the FPC_UNICODESTR_UNIQUE routine for S and
    discards the pointer it returns. }
  Procedure UniqueString (Var S : UnicodeString);{$ifdef SYSTEMINLINE}inline;{$endif}
  begin
    fpc_unicodestr_Unique_func(S);
  end;
  954. {$ifndef FPC_HAS_UNICODESTR_UNIQUE}
  955. {$define FPC_HAS_UNICODESTR_UNIQUE}
  Function fpc_unicodestr_Unique(Var S : Pointer): Pointer; [Public,Alias : 'FPC_UNICODESTR_UNIQUE']; compilerproc;
  {
    Make sure reference count of S is 1,
    using copy-on-write semantics.

    S      : pointer to the string data (nil for an empty string); replaced
             by the private copy when one had to be made
    Result : the value of S on exit
  }
  Var
    SNew : Pointer;
    FullSize : SizeInt;
  begin
    result:=S;
    { nothing to do for an empty string or when the count is already 1 }
    If (result<>nil) and (PUnicodeRec(result-UnicodeFirstOff)^.Ref<>1) then
      begin
        { header + characters + terminating zero }
        FullSize:=PUnicodeRec(result-UnicodeFirstOff)^.Len*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar));
        SNew:=GetMem(FullSize)+UnicodeFirstOff;
        Move ((result-UnicodeFirstOff)^,(SNew-UnicodeFirstOff)^,FullSize); { Copy everything including header and #0, only refcount needs to be adjusted. }
        PUnicodeRec(SNew-UnicodeFirstOff)^.Ref:=1;
        { release this variable's reference to the original only after the
          copy is complete }
        fpc_unicodestr_decr_ref (S); { Thread safe }
        S:=SNew;
        result:=SNew;
      end;
  end;
  977. {$endif FPC_HAS_UNICODESTR_UNIQUE}
  978. {$ifndef FPC_HAS_UNICODESTR_COPY}
  979. {$define FPC_HAS_UNICODESTR_COPY}
  Function Fpc_UnicodeStr_Copy (Const S : UnicodeString; Index,Size : SizeInt) : UnicodeString;compilerproc;
  {
    Returns up to Size characters of S starting at the 1-based position
    Index. An Index below 1 is treated as 1; Size is limited to the
    characters available from that position on. When nothing remains to be
    copied the result is the empty string.
  }
  var
    Avail : SizeInt;
    Hdr : PUnicodeRec;
    NewStr : Pointer;
  begin
    NewStr:=Nil;
    { turn Index into a 0-based offset, never below 0 }
    if Index<1 then
      Index:=0
    else
      dec(Index);
    Avail:=Length(S)-Index; { Cannot overflow as both Length(S) and Index are non-negative. }
    if Size>Avail then
      Size:=Avail;
    if Size>0 then
      begin
        { header + Size characters + terminating zero }
        Hdr:=GetMem(Size*sizeof(UnicodeChar)+(UnicodeFirstOff+sizeof(UnicodeChar)));
        Hdr^.CodePage:=DefaultUnicodeCodePage;
        Hdr^.ElementSize:=sizeof(UnicodeChar);
        Hdr^.Ref:=1;
        Hdr^.Len:=Size;
        NewStr:=Pointer(Hdr)+UnicodeFirstOff;
        Move (PUnicodeChar(Pointer(S))[Index],NewStr^,Size*sizeof(UnicodeChar));
        PUnicodeChar(NewStr)[Size]:=#0;
      end;
    { drop whatever the result variable referenced before, then install the
      new data; this is done only after the characters have been copied }
    fpc_unicodestr_decr_ref(Pointer(Result));
    Pointer(Result):=NewStr;
  end;
  1005. {$endif FPC_HAS_UNICODESTR_COPY}
  1006. {$ifndef FPC_HAS_POS_UNICODESTR_UNICODESTR}
  1007. {$define FPC_HAS_POS_UNICODESTR_UNICODESTR}
  Function Pos (Const Substr : UnicodeString; Const Source : UnicodeString; Offset: Sizeint = 1) : SizeInt;
  {
    Returns the 1-based position of the first occurrence of Substr in
    Source at or after position Offset, or 0 when there is none.
    0 is also returned for an empty Substr and for an Offset outside
    1..Length(Source).
  }
  var
    Cur,LastStart,SrcLen,SubLen,Hit : SizeInt;
  begin
    Result:=0;
    SrcLen:=Length(Source);
    SubLen:=Length(Substr);
    if (SubLen<=0) or (Offset<=0) or (Offset>SrcLen) then
      exit;
    { last position at which a complete match can still start }
    LastStart:=SrcLen-SubLen+1;
    Cur:=Offset;
    while Cur<=LastStart do
      begin
        { jump to the next candidate: an occurrence of the first character }
        Hit:=IndexWord(Source[Cur],LastStart-Cur+1,word(Substr[1]));
        if Hit<0 then
          break;
        inc(Cur,Hit);
        if CompareWord(Substr[1],Source[Cur],SubLen)=0 then
          exit(Cur);
        inc(Cur);
      end;
  end;
  1030. {$endif FPC_HAS_POS_UNICODESTR_UNICODESTR}
  1031. {$ifndef FPC_HAS_POS_UNICODECHAR_UNICODESTR}
  1032. {$define FPC_HAS_POS_UNICODECHAR_UNICODESTR}
  1033. { Faster version for a unicodechar alone }
  Function Pos (c : UnicodeChar; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
  {
    Returns the 1-based position of the first occurrence of c in s at or
    after position Offset, or 0 when there is none or Offset lies outside
    1..Length(s).
  }
  var
    SrcLen,Hit : SizeInt;
  begin
    Result:=0;
    SrcLen:=length(s);
    if (Offset<=0) or (Offset>SrcLen) then
      exit;
    Hit:=IndexWord(s[Offset],SrcLen-Offset+1,word(c));
    if Hit>=0 then
      Result:=Offset+Hit;
  end;
  1047. {$endif FPC_HAS_POS_UNICODECHAR_UNICODESTR}
  1048. { DO NOT inline these! Inlining a managed typecast creates an implicit try..finally
  1049. block, which is significant bloat without any sensible speed improvement. }
  Function Pos (const c : RawByteString; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
  { Converts the search text c to UnicodeString and searches s with it. }
  begin
    Pos:=Pos(UnicodeString(c),s,Offset);
  end;
  Function Pos (const c : ShortString; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
  { Converts the search text c to UnicodeString and searches s with it. }
  begin
    Pos:=Pos(UnicodeString(c),s,Offset);
  end;
  Function Pos (const c : UnicodeString; Const s : RawByteString; Offset: Sizeint = 1) : SizeInt;
  { Converts the searched text s to UnicodeString and looks for c in it. }
  begin
    Pos:=Pos(c,UnicodeString(s),Offset);
  end;
  1062. {$ifndef FPC_HAS_UNICODESTR_OF_CHAR}
  1063. {$define FPC_HAS_UNICODESTR_OF_CHAR}
  Function StringOfChar(c : Unicodechar;l : SizeInt) : UnicodeString;
  { Returns a string made of l copies of c. }
  begin
    SetLength(Result,l);
    { fill according to the length actually obtained, not the requested one }
    FillWord(Pointer(Result)^,Length(Result),word(c));
  end;
  1069. {$endif}
  1070. {$ifndef FPC_HAS_POS_CHAR_UNICODESTR}
  1071. {$define FPC_HAS_POS_CHAR_UNICODESTR}
  { Faster version for an AnsiChar alone. Must be implemented because }
  { pos(c: AnsiChar; const s: shortstring) also exists, so otherwise }
  { using pos(AnsiChar,pansichar) will always call the shortstring version }
  { (exact match for first argument), also with $h+ (JM) }
  Function Pos (c : AnsiChar; Const s : UnicodeString; Offset: Sizeint = 1) : SizeInt;
  {
    Returns the 1-based position of the first occurrence of c (converted to
    a UnicodeChar) in s at or after position Offset, or 0 when there is
    none or Offset lies outside 1..Length(s).
  }
  var
    SrcLen,Hit : SizeInt;
  begin
    Result:=0;
    SrcLen:=length(s);
    if (Offset<=0) or (Offset>SrcLen) then
      exit;
    Hit:=IndexWord(s[Offset],SrcLen-Offset+1,word(unicodechar(c)));
    if Hit>=0 then
      Result:=Offset+Hit;
  end;
  1089. {$endif FPC_HAS_POS_CHAR_UNICODESTR}
  1090. {$ifndef FPC_HAS_DELETE_UNICODESTR}
  1091. {$define FPC_HAS_DELETE_UNICODESTR}
  Procedure fpc_unicodestr_delete(Var S : UnicodeString; Index,Size: SizeInt);
  {
    Removes Size characters from S, starting at the 1-based position Index.
    Nothing happens when Index lies outside 1..Length(S) or Size <= 0.
    A Size reaching beyond the end removes everything from Index on.
  }
  Var
    OldLen,Tail,Start : SizeInt;
  begin
    OldLen:=Length(S);
    if (Index>OldLen) or (Index<=0) or (Size<=0) then
      exit;
    UniqueString (S);
    { number of characters following position Index; comparing against it
      avoids computing Size+Index, which overflows for Size=MaxInt }
    Tail:=OldLen-Index;
    if Size>Tail then
      { deleting up to the end: truncating is all that is needed }
      Size:=Tail+1
    else
      begin
        { close the gap; the terminating zero is moved along }
        Start:=Index-1;
        Move(PUnicodeChar(S)[Start+Size],PUnicodeChar(S)[Start],(OldLen-Start-Size+1)*sizeof(UnicodeChar));
      end;
    Setlength(s,OldLen-Size);
  end;
  1110. {$endif FPC_HAS_DELETE_UNICODESTR}
  1111. {$ifndef FPC_HAS_INSERT_UNICODESTR}
  1112. {$define FPC_HAS_INSERT_UNICODESTR}
  Procedure fpc_unicodestr_insert(Const Source : UnicodeString; Var S : UnicodeString; Index : SizeInt);
  {
    Inserts Source into S in front of the 1-based position Index.
    An Index below 1 inserts at the start, an Index beyond the end appends.
    An empty Source leaves S untouched; an empty S simply becomes Source.
  }
  var
    OldLen,InsLen : SizeInt;
    SameString : boolean;
    InsData : PUnicodeChar;
  begin
    if Source='' then
      exit;
    if S='' then
      begin
        S:=Source;
        exit;
      end;
    InsLen:=PUnicodeRec(Pointer(Source)-UnicodeFirstOff)^.Len;
    OldLen:=PUnicodeRec(Pointer(S)-UnicodeFirstOff)^.Len;
    { turn Index into a 0-based offset limited to 0..OldLen }
    if Index<1 then
      Index:=0
    else
      Dec(Index);
    if Index>OldLen then
      Index:=OldLen;
    { find out whether a string is inserted into itself before SetLength
      gets the chance to give S a different buffer }
    SameString:=Pointer(Source)=Pointer(S);
    SetLength(S,InsLen+OldLen);
    { open the gap by shifting the tail up }
    Move(PUnicodeChar(Pointer(S))[Index],PUnicodeChar(Pointer(S))[Index+InsLen],(OldLen-Index)*sizeof(UnicodeChar));
    { for a self-insert the characters are taken from the resized S }
    if selfinsert_guard(SameString) then
      InsData:=Pointer(S)
    else
      InsData:=Pointer(Source);
    Move(InsData^,PUnicodeChar(Pointer(S))[Index],InsLen*SizeOf(UnicodeChar));
  end;
  1141. {$endif FPC_HAS_INSERT_UNICODESTR}
  1142. {$ifndef FPC_HAS_UPCASE_UNICODECHAR}
  1143. {$define FPC_HAS_UPCASE_UNICODECHAR}
  Function UpCase(c:UnicodeChar):UnicodeChar;
  { Upper-cases a single character by running it through the widestring
    manager as a one-character string and returning the first character
    of the outcome. }
  var
    Converted : UnicodeString;
  begin
    Converted:=widestringmanager.UpperUnicodeStringProc(UnicodeString(c));
    Result:=Converted[1];
  end;
  1148. {$endif FPC_HAS_UPCASE_UNICODECHAR}
  1149. {$ifndef FPC_HAS_UPCASE_UNICODESTR}
  1150. {$define FPC_HAS_UPCASE_UNICODESTR}
  function UpCase(const s : UnicodeString) : UnicodeString;
  { Returns s as converted by the widestring manager's
    UpperUnicodeStringProc. }
  begin
    UpCase:=widestringmanager.UpperUnicodeStringProc(s);
  end;
  1155. {$endif FPC_HAS_UPCASE_UNICODESTR}
  1156. {$ifndef FPC_HAS_LOWERCASE_UNICODECHAR}
  1157. {$define FPC_HAS_LOWERCASE_UNICODECHAR}
  Function LowerCase(c:UnicodeChar):UnicodeChar;
  { Lower-cases a single character by running it through the widestring
    manager as a one-character string and returning the first character
    of the outcome. }
  var
    Converted : UnicodeString;
  begin
    Converted:=widestringmanager.LowerUnicodeStringProc(UnicodeString(c));
    Result:=Converted[1];
  end;
  1162. {$endif FPC_HAS_LOWERCASE_UNICODECHAR}
  1163. {$ifndef FPC_HAS_LOWERCASE_UNICODESTR}
  1164. {$define FPC_HAS_LOWERCASE_UNICODESTR}
  function LowerCase(const s : UnicodeString) : UnicodeString;
  { Returns s as converted by the widestring manager's
    LowerUnicodeStringProc. }
  begin
    LowerCase:=widestringmanager.LowerUnicodeStringProc(s);
  end;
  1169. {$endif FPC_HAS_LOWERCASE_UNICODESTR}
  1170. {$ifndef FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
  1171. {$define FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
  Procedure fpc_setstring_unicodestr_pwidechar(Out S : UnicodeString; Buf : PUnicodeChar; Len : SizeInt); compilerproc;
  {
    Gives S a length of Len characters and, when Buf is assigned and Len is
    positive, fills it with the first Len characters found at Buf.
  }
  begin
    SetLength(S,Len);
    if (Buf=Nil) or (Len<=0) then
      exit;
    Move (Buf[0],S[1],Len*sizeof(UnicodeChar));
  end;
  1178. {$endif FPC_HAS_SETSTRING_UNICODESTR_PUNICODECHAR}
  1179. {$ifndef FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
  1180. {$define FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
  Procedure fpc_setstring_unicodestr_pansichar(Out S : UnicodeString; Buf : PAnsiChar; Len : SizeInt); compilerproc;
  {
    Sets S to the first Len bytes at Buf, converted from
    DefaultSystemCodePage by the widestring manager. Without a buffer or
    with a non-positive Len only the length of S is set.
  }
  begin
    if (Buf=Nil) or (Len<=0) then
      SetLength(S,Len)
    else
      widestringmanager.Ansi2UnicodeMoveProc(Buf,DefaultSystemCodePage,S,Len);
  end;
  1188. {$endif FPC_HAS_SETSTRING_UNICODESTR_PCHAR}
  1189. {$ifndef FPUNONE}
  Function fpc_Val_Real_UnicodeStr(Const S : UnicodeString; out Code : ValSInt): ValReal; [public, alias:'FPC_VAL_REAL_UNICODESTR']; compilerproc;
  {
    Val for floating point targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,code);
      end
    else
      code:=256;
  end;
  1203. {$endif}
  1204. {$ifndef FPC_STR_ENUM_INTERN}
  function fpc_val_enum_unicodestr(str2ordindex:pointer;const s:unicodestring;out code:valsint):longint;compilerproc;
  {
    Val helper for enumeration targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with code=256 and a result of 0, like the other
    UnicodeString Val helpers in this file.

    NOTE(review): str2ordindex is not used by this routine - confirm
    whether the lookup table was meant to be passed on to the ShortString
    enumeration parser.
  }
  var
    ss: ShortString;
  begin
    { give the result a defined value on the rejection path as well }
    fpc_val_enum_unicodestr:=0;
    if length(s)>255 then
      code:=256
    else
      begin
        ss:=ShortString(s);
        val(ss,fpc_val_enum_unicodestr,code);
      end;
  end;
  1217. {$endif FPC_STR_ENUM_INTERN}
  Function fpc_Val_Currency_UnicodeStr(Const S : UnicodeString; out Code : ValSInt): Currency; [public, alias:'FPC_VAL_CURRENCY_UNICODESTR']; compilerproc;
  {
    Val for Currency targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,code);
      end
    else
      begin
        Result:=0;
        code:=256;
      end;
  end;
  Function fpc_Val_UInt_UnicodeStr ({$ifndef VER3_2}DestSize: SizeInt;{$endif VER3_2} Const S : UnicodeString; out Code : ValSInt): ValUInt; [public, alias:'FPC_VAL_UINT_UNICODESTR']; compilerproc;
  {
    Val for unsigned integer targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,code);
      end
    else
      code:=256;
  end;
  Function fpc_Val_SInt_UnicodeStr (DestSize: SizeInt; Const S : UnicodeString; out Code : ValSInt): ValSInt; [public, alias:'FPC_VAL_SINT_UNICODESTR']; compilerproc;
  {
    Val for signed integer targets with a UnicodeString source.
    The text is handed to int_Val_SInt_ShortStr together with DestSize;
    input longer than 255 characters is rejected with Code=256 and a
    result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Result:=int_Val_SInt_ShortStr(DestSize,Narrow,Code);
      end
    else
      code:=256;
  end;
  1259. {$ifndef CPU64}
  Function fpc_Val_qword_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): qword; [public, alias:'FPC_VAL_QWORD_UNICODESTR']; compilerproc;
  {
    Val for QWord targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  Function fpc_Val_int64_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): Int64; [public, alias:'FPC_VAL_INT64_UNICODESTR']; compilerproc;
  {
    Val for Int64 targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  1286. {$endif CPU64}
  1287. {$if defined(CPU16) or defined(CPU8)}
  Function fpc_Val_longword_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): longword; [public, alias:'FPC_VAL_LONGWORD_UNICODESTR']; compilerproc;
  {
    Val for LongWord targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  Function fpc_Val_longint_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): LongInt; [public, alias:'FPC_VAL_LONGINT_UNICODESTR']; compilerproc;
  {
    Val for LongInt targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  Function fpc_Val_word_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): word; [public, alias:'FPC_VAL_WORD_UNICODESTR']; compilerproc;
  {
    Val for Word targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  Function fpc_Val_smallint_UnicodeStr (Const S : UnicodeString; out Code : ValSInt): SmallInt; [public, alias:'FPC_VAL_SMALLINT_UNICODESTR']; compilerproc;
  {
    Val for SmallInt targets with a UnicodeString source.
    The text is parsed as a ShortString; input longer than 255 characters
    is rejected with Code=256 and a result of 0.
  }
  Var
    Narrow: ShortString;
  begin
    Result:=0;
    if length(S)<=255 then
      begin
        Narrow:=ShortString(S);
        Val(Narrow,Result,Code);
      end
    else
      code:=256;
  end;
  1340. {$endif CPU16 or CPU8}
  1341. {$ifndef FPUNONE}
  procedure fpc_UnicodeStr_Float(d : ValReal;len,fr,rt : SizeInt;out s : UnicodeString);compilerproc;
  { Str for floating point values with a UnicodeString target: formats d
    into a ShortString with str_real and converts the outcome. }
  var
    formatted: shortstring;
  begin
    str_real(len,fr,d,treal_type(rt),formatted);
    s:=UnicodeString(formatted);
  end;
  1349. {$endif}
  1350. {$ifndef FPC_STR_ENUM_INTERN}
  procedure fpc_unicodestr_enum(ordinal,len:sizeint;typinfo,ord2strindex:pointer;out s:unicodestring);compilerproc;
  { Str for enumeration values with a UnicodeString target: lets
    fpc_shortstr_enum produce a ShortString and converts the outcome. }
  var
    formatted: ShortString;
  begin
    fpc_shortstr_enum(ordinal,len,typinfo,ord2strindex,formatted);
    s:=UnicodeString(formatted);
  end;
  1358. {$endif FPC_STR_ENUM_INTERN}
  procedure fpc_unicodestr_bool(b : boolean;len:sizeint;out s:unicodestring);compilerproc;
  { Str for boolean values with a UnicodeString target: lets
    fpc_shortstr_bool produce a ShortString and converts the outcome. }
  var
    formatted: ShortString;
  begin
    fpc_shortstr_bool(b,len,formatted);
    s:=UnicodeString(formatted);
  end;
  procedure fpc_UnicodeStr_Currency(c : Currency;len,fr : SizeInt;out s : UnicodeString);compilerproc;
  { Str for Currency values with a UnicodeString target: formats c with
    width len and fr decimals into a ShortString and converts the outcome. }
  var
    formatted: shortstring;
  begin
    str(c:len:fr,formatted);
    s:=UnicodeString(formatted);
  end;
  Procedure fpc_UnicodeStr_SInt(v : ValSint; Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for signed integers with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    Str (v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  Procedure fpc_UnicodeStr_UInt(v : ValUInt;Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for unsigned integers with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    str(v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  1387. {$ifndef CPU64}
  Procedure fpc_UnicodeStr_Int64(v : Int64; Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for Int64 values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    Str (v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  Procedure fpc_UnicodeStr_Qword(v : Qword;Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for QWord values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    str(v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  1402. {$endif CPU64}
  1403. {$if defined(CPU16) or defined(CPU8)}
  Procedure fpc_UnicodeStr_LongInt(v : LongInt; Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for LongInt values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    Str (v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  Procedure fpc_UnicodeStr_LongWord(v : LongWord;Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for LongWord values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    str(v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  Procedure fpc_UnicodeStr_SmallInt(v : SmallInt; Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for SmallInt values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    Str (v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  Procedure fpc_UnicodeStr_Word(v : Word;Len : SizeInt; out S : UnicodeString);compilerproc;
  { Str for Word values with a UnicodeString target: formats v with
    width Len into a ShortString and converts the outcome. }
  Var
    Digits: ShortString;
  begin
    str(v:Len,Digits);
    S:=UnicodeString(Digits);
  end;
  1432. {$endif CPU16 or CPU8}
  function UnicodeToUtf8(Dest: PAnsiChar; Source: PUnicodeChar; MaxBytes: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
  { Variant for zero-terminated input: determines the length of Source and
    forwards to the overload taking explicit sizes. Returns 0 for a nil
    Source. }
  begin
    Result:=0;
    if Source<>nil then
      Result:=UnicodeToUtf8(Dest,MaxBytes,Source,Length(Source));
  end;
  { Encodes SourceChars UTF-16 code units at Source as UTF-8.

    Dest assigned : bytes are written to Dest for as long as complete
                    sequences fit into MaxDestBytes, then a #0 is stored.
    Dest = nil    : nothing is written, only the size is counted.

    Result is 0 for a nil Source, otherwise the byte count j plus one for
    the terminator.

    In both modes a high surrogate without a following low surrogate
    contributes no bytes, and code units $dc00..$dfff met on their own
    match no case label and are skipped as well.

    With EXCLUDE_COMPLEX_PROCS defined the routine only calls runerror(217). }
  function UnicodeToUtf8(Dest: PAnsiChar; MaxDestBytes: SizeUInt; Source: PUnicodeChar; SourceChars: SizeUInt): SizeUInt;
  {$ifdef EXCLUDE_COMPLEX_PROCS}
  begin
    runerror(217);
  end;
  {$else EXCLUDE_COMPLEX_PROCS}
  var
    i,j : SizeUInt;
    lw : longword;
  begin
    result:=0;
    if source=nil then
      exit;
    { i indexes Source, j counts output bytes }
    i:=0;
    j:=0;
    if assigned(Dest) then
      begin
        while (i<SourceChars) and (j<MaxDestBytes) do
          begin
            lw:=ord(Source[i]);
            case lw of
              0..$7f:
                { one byte; room is guaranteed by the loop condition }
                begin
                  Dest[j]:=AnsiChar(lw);
                  inc(j);
                end;
              $80..$7ff:
                { two bytes }
                begin
                  if j+1>=MaxDestBytes then
                    break;
                  Dest[j]:=AnsiChar($c0 or (lw shr 6));
                  Dest[j+1]:=AnsiChar($80 or (lw and $3f));
                  inc(j,2);
                end;
              $800..$d7ff,$e000..$ffff:
                { three bytes }
                begin
                  if j+2>=MaxDestBytes then
                    break;
                  Dest[j]:=AnsiChar($e0 or (lw shr 12));
                  Dest[j+1]:=AnsiChar($80 or ((lw shr 6) and $3f));
                  Dest[j+2]:=AnsiChar($80 or (lw and $3f));
                  inc(j,3);
                end;
              $d800..$dbff:
                {High Surrogates}
                begin
                  { the room check is made before it is known whether a
                    low surrogate follows }
                  if j+3>=MaxDestBytes then
                    break;
                  if (i+1<sourcechars) and
                     (word(Source[i+1]) >= $dc00) and
                     (word(Source[i+1]) <= $dfff) then
                    begin
                      { $d7c0 is ($d800 - ($10000 shr 10)) }
                      lw:=(longword(lw-$d7c0) shl 10) + (ord(source[i+1]) xor $dc00);
                      Dest[j]:=AnsiChar($f0 or (lw shr 18));
                      Dest[j+1]:=AnsiChar($80 or ((lw shr 12) and $3f));
                      Dest[j+2]:=AnsiChar($80 or ((lw shr 6) and $3f));
                      Dest[j+3]:=AnsiChar($80 or (lw and $3f));
                      inc(j,4);
                      { the low surrogate has been consumed too }
                      inc(i);
                    end;
                end;
              end;
            inc(i);
          end;
        { keep the terminator inside the buffer; when the buffer is full it
          replaces the last byte written }
        { NOTE(review): for MaxDestBytes=0 the subtraction wraps around, so
          no clamping happens and Dest[0] is written - confirm that callers
          never pass an empty buffer }
        if j>SizeUInt(MaxDestBytes-1) then
          j:=MaxDestBytes-1;
        Dest[j]:=#0;
      end
    else
      begin
        { counting only: same classification as above without any stores }
        while i<SourceChars do
          begin
            case word(Source[i]) of
              $0..$7f:
                inc(j);
              $80..$7ff:
                inc(j,2);
              $800..$d7ff,$e000..$ffff:
                inc(j,3);
              $d800..$dbff:
                begin
                  if (i+1<sourcechars) and
                     (word(Source[i+1]) >= $dc00) and
                     (word(Source[i+1]) <= $dfff) then
                    begin
                      inc(j,4);
                      inc(i);
                    end;
                end;
              end;
            inc(i);
          end;
      end;
    { one more than the byte count, for the terminator }
    result:=j+1;
  end;
  {$endif EXCLUDE_COMPLEX_PROCS}
  { Convenience overload: decodes the null-terminated UTF-8 string Source.
    The byte count is taken with length(Source) and the work is delegated to
    the five-argument overload with IgnoreInvalid=True. Returns 0 when Source
    is nil. }
  function Utf8ToUnicode(Dest: PUnicodeChar; Source: PAnsiChar; MaxChars: SizeInt): SizeInt;{$ifdef SYSTEMINLINE}inline;{$endif}
  begin
    if Source=nil then
      exit(0);
    Result:=Utf8ToUnicode(Dest,MaxChars,Source,length(Source),True);
  end;
  { Four-argument overload: forwards to the five-argument Utf8ToUnicode with
    IgnoreInvalid=True. }
  function UTF8ToUnicode(Dest: PUnicodeChar; MaxDestChars: SizeUInt; Source: PAnsiChar; SourceBytes: SizeUInt): SizeUInt;{$ifdef SYSTEMINLINE}inline;{$endif}
  const
    SkipInvalidInput = True;
  begin
    Result:=Utf8ToUnicode(Dest,MaxDestChars,Source,SourceBytes,SkipInvalidInput);
  end;
  { Decodes SourceBytes bytes of UTF-8 from Source into UTF-16.

    Dest<>nil : writes at most MaxDestChars code units. A #0 terminator is
                stored only if there is still room for it.
    Dest=nil  : nothing is written; only the required size is counted.

    Accepted sequences: 1 byte (0..$7F), 2 bytes (lead $C2..$DF), 3 bytes
    (lead $E0..$EF, value $800..$FFFD excluding $D800..$DFFF) and 4 bytes
    (lead $F0..$F4, value $10000..$10FFFF, stored as a surrogate pair).
    Anything else is invalid: with IgnoreInvalid=False HandleError(231) is
    raised; otherwise the offending lead byte plus any continuation bytes
    following it are consumed and counted as one code unit ('?' when
    writing).

    Returns 0 when Source is nil, otherwise the number of code units produced
    plus one for the terminator (counted even when it was not stored). }
  function Utf8ToUnicode(Dest: PUnicodeChar; MaxDestChars: SizeUInt; Source: PAnsiChar; SourceBytes: SizeUInt; IgnoreInvalid : Boolean): SizeUInt;
  {$ifdef EXCLUDE_COMPLEX_PROCS}
  begin
    runerror(217);
  end;
  {$else EXCLUDE_COMPLEX_PROCS}
  var
    InPos,OutPos: SizeUint;
    CP: int32;
  begin
    if Source=nil then
      exit(0);
    InPos:=0;
    OutPos:=0;
    if Dest<>nil then
      begin
        { The loop is deliberately "repeat ... until false" with explicit
          continue/break after every successfully decoded character (the
          original author notes this gives better code than "while").
          Falling out of the case statement means: invalid or incomplete. }
        if InPos<SourceBytes then
          repeat
            { Reserve one output unit up front. }
            if OutPos>=MaxDestChars then
              break;
            inc(OutPos);
            CP:=ord(Source[InPos]);
            case uint32(CP) of
              0..$7F:
                begin
                  Dest[OutPos-1]:=unicodechar(CP);
                  inc(InPos);
                  if InPos<SourceBytes then continue else break;
                end;
              $C2..$DF:
                if (InPos+1<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) then
                  begin
                    Dest[OutPos-1]:=unicodechar(((CP and $1F) shl 6) or (ord(Source[InPos+1]) and $3F));
                    inc(InPos,2);
                    if InPos<SourceBytes then continue else break;
                  end;
              $E0..$EF:
                if (InPos+2<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) and ((ord(Source[InPos+2]) and $C0)=$80) then
                  begin
                    CP:=((CP and $F) shl 12) or ((ord(Source[InPos+1]) and $3F) shl 6) or (ord(Source[InPos+2]) and $3F);
                    { Reject overlong forms, surrogates and values above $FFFD. }
                    if (CP>=$800) and (CP<=$FFFD) and not ((CP>=$D800) and (CP<=$DFFF)) then
                      begin
                        Dest[OutPos-1]:=unicodechar(CP);
                        inc(InPos,3);
                        if InPos<SourceBytes then continue else break;
                      end;
                  end;
              $F0..$F4:
                if (InPos+3<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) and ((ord(Source[InPos+2]) and $C0)=$80) and ((ord(Source[InPos+3]) and $C0)=$80) then
                  begin
                    { CP holds the code point minus $10000. }
                    CP:=(((CP and $7) shl 18) or ((ord(Source[InPos+1]) and $3F) shl 12) or ((ord(Source[InPos+2]) and $3F) shl 6) or (ord(Source[InPos+3]) and $3F))-$10000;
                    if Cardinal(CP)<=$10FFFF-$10000 then
                      begin
                        { Undo the single-unit reservation; a pair needs two. }
                        dec(OutPos);
                        if OutPos+1>=MaxDestChars then
                          break;
                        Dest[OutPos]:=unicodechar($D800+(CP shr 10));
                        Dest[OutPos+1]:=unicodechar($DC00+(CP and $3ff));
                        inc(InPos,4);
                        inc(OutPos,2);
                        if InPos<SourceBytes then continue else break;
                      end;
                  end;
            end;
            { Invalid or incomplete sequence. }
            if not IgnoreInvalid then
              HandleError(231); { original note: converted to EConversionError in sysutils }
            inc(InPos); { drop the first byte }
            if (ord(Source[InPos-1]) and $C0)<>$80 then
              { it was not itself a continuation byte: drop its trailing ones too }
              while (InPos<SourceBytes) and ((ord(Source[InPos]) and $C0)=$80) do
                inc(InPos);
            Dest[OutPos-1]:='?';
            { Keep this test inside the body: as a loop condition it would
              become the target of the "continue" statements above. }
            if InPos>=SourceBytes then break;
          until false;
        if OutPos<MaxDestChars then
          Dest[OutPos]:=#0;
      end
    else
      { Counting pass: same decoding rules, no stores and no output limit. }
      if InPos<SourceBytes then
        repeat
          CP:=ord(Source[InPos]);
          inc(OutPos); { assume one code unit }
          case uint32(CP) of
            0..$7F:
              begin
                inc(InPos);
                if InPos<SourceBytes then continue else break;
              end;
            $C2..$DF:
              if (InPos+1<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) then
                begin
                  inc(InPos,2);
                  if InPos<SourceBytes then continue else break;
                end;
            $E0..$EF:
              if (InPos+2<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) and ((ord(Source[InPos+2]) and $C0)=$80) then
                begin
                  CP:=((CP and $F) shl 12) or ((ord(Source[InPos+1]) and $3F) shl 6) or (ord(Source[InPos+2]) and $3F);
                  if (CP>=$800) and (CP<=$FFFD) and not ((CP>=$D800) and (CP<=$DFFF)) then
                    begin
                      inc(InPos,3);
                      if InPos<SourceBytes then continue else break;
                    end;
                end;
            $F0..$F4:
              if (InPos+3<SourceBytes) and ((ord(Source[InPos+1]) and $C0)=$80) and ((ord(Source[InPos+2]) and $C0)=$80) and ((ord(Source[InPos+3]) and $C0)=$80) then
                begin
                  CP:=(((CP and $7) shl 18) or ((ord(Source[InPos+1]) and $3F) shl 12) or ((ord(Source[InPos+2]) and $3F) shl 6) or (ord(Source[InPos+3]) and $3F))-$10000;
                  if Cardinal(CP)<=$10FFFF-$10000 then
                    begin
                      inc(InPos,4);
                      inc(OutPos); { surrogate pair: two code units in total }
                      if InPos<SourceBytes then continue else break;
                    end;
                end;
          end;
          if not IgnoreInvalid then
            HandleError(231);
          inc(InPos);
          if (ord(Source[InPos-1]) and $C0)<>$80 then
            while (InPos<SourceBytes) and ((ord(Source[InPos]) and $C0)=$80) do
              inc(InPos);
          if InPos>=SourceBytes then break;
        until false;
    Result:=OutPos+1; { terminator is counted in both branches }
  end;
  {$endif EXCLUDE_COMPLEX_PROCS}
  { Encodes a byte string as UTF-8 by first converting it to a UnicodeString
    and then calling the UnicodeString overload of UTF8Encode. }
  function UTF8Encode(const s : RawByteString) : RawByteString; inline;
  var
    wide : UnicodeString;
  begin
    wide:=UnicodeString(s);
    Result:=UTF8Encode(wide);
  end;
  {$ifndef FPC_HAS_UTF8ENCODE_UNICODESTRING}
  {$define FPC_HAS_UTF8ENCODE_UNICODESTRING}
  { Returns s encoded as UTF-8; an empty input yields an empty string.
    The result is first sized to three bytes per UTF-16 code unit, filled by
    UnicodeToUtf8, then shrunk to the number of bytes actually written. }
  function UTF8Encode(const s : UnicodeString) : RawByteString;
  var
    srclen : SizeInt;
    written : SizeUInt;
  begin
    result:='';
    srclen:=Length(s);
    if srclen=0 then
      exit;
    SetLength(utf8string(result),srclen*3);
    { UnicodeToUtf8 counts the terminating #0, hence the +1 / -1. }
    written:=UnicodeToUtf8(pointer(result),srclen*3+1,pointer(s),srclen);
    SetLength(utf8string(result),written-1); { SetLength(-1) is equivalent to SetLength(0). }
  end;
  {$endif FPC_HAS_UTF8ENCODE_UNICODESTRING}
  {$ifndef FPC_HAS_UTF8DECODE_UNICODESTRING}
  {$define FPC_HAS_UTF8DECODE_UNICODESTRING}
  { Decodes the bytes of s as UTF-8 into a UnicodeString; an empty input
    yields an empty string. The result is first sized to one code unit per
    input byte, filled by Utf8ToUnicode, then shrunk to the number of code
    units actually produced. }
  function UTF8Decode(const s : RawByteString): UnicodeString;
  var
    srclen : SizeInt;
    produced : SizeUInt;
  begin
    result:='';
    srclen:=Length(s);
    if srclen=0 then
      exit;
    SetLength(result,srclen);
    { Utf8ToUnicode counts the terminating #0, hence the +1 / -1. }
    produced:=Utf8ToUnicode(pointer(result),srclen+1,pointer(s),srclen);
    SetLength(result,produced-1);
  end;
  {$endif FPC_HAS_UTF8DECODE_UNICODESTRING}
  { Thin wrapper: returns Utf8Encode(s). }
  function AnsiToUtf8(const s : RawByteString): RawByteString;{$ifdef SYSTEMINLINE}inline;{$endif}
  begin
    AnsiToUtf8:=Utf8Encode(s);
  end;
  { Decodes s as UTF-8 with Utf8Decode and converts the resulting
    UnicodeString back to a RawByteString. }
  function Utf8ToAnsi(const s : RawByteString) : RawByteString;{$ifdef SYSTEMINLINE}inline;{$endif}
  var
    decoded : UnicodeString;
  begin
    decoded:=Utf8Decode(s);
    Result:=RawByteString(decoded);
  end;
  1717. {$ifdef FPC_HAS_FEATURE_DYNARRAYS}
  { Converts len UTF-16 code units starting at p into a UCS4String.
    A high surrogate directly followed by a low surrogate becomes a single
    code point; every other code unit (unpaired surrogates included) is
    copied through unchanged. res always ends with an explicit 0 element. }
  procedure UCS4Encode(p: PWideChar; len: sizeint; out res: UCS4String);

    { True when a well-formed surrogate pair starts at p[idx]. }
    function IsPairAt(idx: sizeint): boolean;
    begin
      IsPairAt:=(p[idx]>=#$d800) and (p[idx]<=#$dbff) and
                (idx+1<len) and
                (p[idx+1]>=#$dc00) and (p[idx+1]<=#$dfff);
    end;

  var
    srcpos, count: sizeint;
    hi: longint;
  begin
    { pass 1: count the resulting code points }
    count:=0;
    srcpos:=0;
    while srcpos<len do
      begin
        if IsPairAt(srcpos) then
          inc(srcpos,2)
        else
          inc(srcpos);
        inc(count);
      end;
    SetLength(res,count+1); { +1 for null termination }
    { pass 2: convert }
    count:=0;
    srcpos:=0;
    while srcpos<len do
      begin
        hi:=ord(p[srcpos]);
        if IsPairAt(srcpos) then
          begin
            { $d7c0 = $d800 - ($10000 shr 10) }
            res[count]:=(UCS4Char(hi-$d7c0) shl 10)+(UCS4Char(p[srcpos+1]) xor $dc00);
            inc(srcpos,2);
          end
        else
          begin
            res[count]:=hi;
            inc(srcpos);
          end;
        inc(count);
      end;
    res[count]:=0;
  end;
  {$ifndef FPC_HAS_UCS4STRING_TO_UNICODESTR}
  {$define FPC_HAS_UCS4STRING_TO_UNICODESTR}
  { Returns the contents of s as a UCS4String; the conversion itself is done
    by UCS4Encode. }
  function UnicodeStringToUCS4String(const s : UnicodeString) : UCS4String;
  var
    units : SizeInt;
  begin
    units:=Length(s);
    UCS4Encode(PWideChar(s),units,result);
  end;
  {$endif FPC_HAS_UCS4STRING_TO_UNICODESTR}
  {$ifndef FPC_HAS_WIDESTR_TO_UCS4STRING}
  {$define FPC_HAS_WIDESTR_TO_UCS4STRING}
  { Returns the contents of s as a UCS4String; the conversion itself is done
    by UCS4Encode. }
  function WideStringToUCS4String(const s : WideString) : UCS4String;
  var
    units : SizeInt;
  begin
    units:=Length(s);
    UCS4Encode(PWideChar(s),units,result);
  end;
  {$endif FPC_HAS_WIDESTR_TO_WIDESTR_TO_UCS4STRING}
  1777. {$ifndef FPC_HAS_UCS4STRING_TO_WIDESTR}
  1778. {$define FPC_HAS_UCS4STRING_TO_WIDESTR}
  { Writes the code points of s (without its explicit terminating 0 element)
    to dest as UTF-16. dest must point to a previously allocated
    wide/unicodestring that is large enough; no terminator is written.
    Code points up to $ffff are stored as one code unit, code points up to
    $10ffff as a surrogate pair, anything larger as '?'. }
  procedure UCS4Decode(const s: UCS4String; dest: PWideChar);
  var
    idx, last: sizeint;
    cp: UCS4Char;
  begin
    last:=length(s)-2; { -2 because s contains explicit terminating #0 }
    idx:=0;
    while idx<=last do
      begin
        cp:=s[idx];
        if cp<=$ffff then
          begin
            dest^:=widechar(cp);
            inc(dest);
          end
        else if dword(cp)<=$10ffff then
          begin
            dest[0]:=widechar(cp shr 10 + $d7c0);
            { subtracting $10000 doesn't change low 10 bits }
            dest[1]:=widechar(cp and $3ff + $dc00);
            inc(dest,2);
          end
        else
          begin
            { invalid code point }
            dest^:='?';
            inc(dest);
          end;
        inc(idx);
      end;
  end;
  { Converts s to a UnicodeString. The required length is computed first
    (two code units for code points in $10000..$10ffff, one for everything
    else), then UCS4Decode fills the result. }
  function UCS4StringToUnicodeString(const s : UCS4String) : UnicodeString;
  var
    idx : SizeInt;
    units : SizeInt;
  begin
    units:=0;
    for idx:=0 to length(s)-2 do { skip terminating #0 }
      if (s[idx]>$ffff) and (cardinal(s[idx])<=$10ffff) then
        Inc(units,2)
      else
        Inc(units);
    SetLength(result,units);
    UCS4Decode(s,pointer(result));
  end;
  { Converts s to a WideString. The required length is computed first
    (two code units for code points in $10000..$10ffff, one for everything
    else), then UCS4Decode fills the result. }
  function UCS4StringToWideString(const s : UCS4String) : WideString;
  var
    idx : SizeInt;
    units : SizeInt;
  begin
    units:=0;
    for idx:=0 to length(s)-2 do { skip terminating #0 }
      if (s[idx]>$ffff) and (cardinal(s[idx])<=$10ffff) then
        Inc(units,2)
      else
        Inc(units);
    SetLength(result,units);
    UCS4Decode(s,pointer(result));
  end;
  1824. {$endif FPC_HAS_UCS4STRING_TO_WIDESTR}
  1825. {$endif FPC_HAS_FEATURE_DYNARRAYS}
  1826. {$ifndef FPC_HAS_BUILTIN_WIDESTR_MANAGER}
  const
    { Messages printed by unimplementedunicodestring. }
    SNoUnicodestrings = 'This binary has no string conversion support compiled in.';
    SRecompileWithUnicodestrings = 'Recompile the application with a unit that installs a unicodestring manager in the program uses clause.';

  { Called when an operation needs a string manager that was not installed.
    Where console I/O is available (and verbose reporting is not disabled)
    both messages are written to StdErr for console programs; afterwards
    runtime error 234 is raised at the caller's address and frame. }
  procedure unimplementedunicodestring;
  begin
  {$ifdef FPC_HAS_FEATURE_CONSOLEIO}
  {$ifndef HAS_WIDESTRINGMANAGER}
  {$ifndef FPC_SYSTEM_NO_VERBOSE_UNICODEERROR}
    if IsConsole then
      begin
        Writeln(StdErr,SNoUnicodestrings);
        Writeln(StdErr,SRecompileWithUnicodestrings);
      end;
  {$endif FPC_SYSTEM_NO_VERBOSE_UNICODEERROR}
  {$endif HAS_WIDESTRINGMANAGER}
  {$endif FPC_HAS_FEATURE_CONSOLEIO}
    HandleErrorAddrFrameInd(234{RuntimeErrorExitCodes[reCodesetConversion]},get_pc_addr,get_frame);
  end;
  { Returns the ElementSize field of the string header of S, or
    SizeOf(UnicodeChar) for an empty (nil) string. }
  function StringElementSize(const S: UnicodeString): Word; overload;
  begin
    if Pointer(S)=nil then
      exit(SizeOf(UnicodeChar));
    Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.ElementSize;
  end;
  { Returns the Ref field of the string header of S, or 0 for an empty (nil)
    string. }
  function StringRefCount(const S: UnicodeString): SizeInt; overload;
  begin
    if Pointer(S)=nil then
      exit(0);
    Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.Ref;
  end;
  { Returns the CodePage field of the string header of S, or
    DefaultUnicodeCodePage for an empty (nil) string. }
  function StringCodePage(const S: UnicodeString): TSystemCodePage; overload;
  begin
    if Pointer(S)=nil then
      exit(DefaultUnicodeCodePage);
    Result:=PUnicodeRec(pointer(S)-UnicodeFirstOff)^.CodePage;
  end;
  1866. {$push}
  1867. {$warnings off}
  { Placeholder for the UnicodeString upper/lower case hooks: only reports
    the missing string manager via unimplementedunicodestring. The result is
    never assigned. }
  function StubUnicodeCase(const s : UnicodeString) : UnicodeString;
  begin
    unimplementedunicodestring;
  end;
  { Placeholder for the UnicodeString compare hook: only reports the missing
    string manager via unimplementedunicodestring. The result is never
    assigned. }
  function StubCompareUnicodeString(const s1, s2 : UnicodeString; Options : TCompareOptions) : PtrInt;
  begin
    unimplementedunicodestring;
  end;
  { Placeholder for the WideString upper/lower case hooks: only reports the
    missing string manager via unimplementedunicodestring. The result is
    never assigned. }
  function StubWideCase(const s: WideString): WideString;
  begin
    unimplementedunicodestring;
  end;
  { Placeholder for the WideString compare hook: only reports the missing
    string manager via unimplementedunicodestring. The result is never
    assigned. }
  function StubCompareWideString(const s1, s2 : WideString; Options : TCompareOptions) : PtrInt;
  begin
    unimplementedunicodestring;
  end;
  1884. {$pop}
  { Installs the default entries of widestringmanager.
    Without HAS_WIDESTRINGMANAGER the record is reset first and the default
    conversion routines, the case-conversion stubs and the default code page
    query are installed. The compare stubs and the default length routines
    are installed in every configuration. }
  procedure initunicodestringmanager;
  begin
  {$ifndef HAS_WIDESTRINGMANAGER}
    widestringmanager:=Default(TUnicodeStringManager);

    { ansi <-> wide/unicode conversion }
  {$ifdef FPC_WIDESTRING_EQUAL_UNICODESTRING}
    widestringmanager.Ansi2WideMoveProc:=@defaultAnsi2UnicodeMove;
  {$else FPC_WIDESTRING_EQUAL_UNICODESTRING}
    widestringmanager.Ansi2WideMoveProc:=@DefaultAnsi2WideMove;
  {$endif FPC_WIDESTRING_EQUAL_UNICODESTRING}
    widestringmanager.Wide2AnsiMoveProc:=@DefaultUnicode2AnsiMove;
    widestringmanager.Ansi2UnicodeMoveProc:=@DefaultAnsi2UnicodeMove;
    widestringmanager.Unicode2AnsiMoveProc:=@DefaultUnicode2AnsiMove;

    { case conversion is not available by default }
    widestringmanager.UpperWideStringProc:=@StubWideCase;
    widestringmanager.LowerWideStringProc:=@StubWideCase;
    widestringmanager.UpperUnicodeStringProc:=@StubUnicodeCase;
    widestringmanager.LowerUnicodeStringProc:=@StubUnicodeCase;

    widestringmanager.GetStandardCodePageProc:=@DefaultGetStandardCodePage;
  {$endif HAS_WIDESTRINGMANAGER}

    { comparison is not available by default }
    widestringmanager.CompareWideStringProc:=@StubCompareWideString;
    // widestringmanager.CompareTextWideStringProc:=@StubCompareWideString;
    widestringmanager.CompareUnicodeStringProc:=@StubCompareUnicodeString;

    widestringmanager.CharLengthPCharProc:=@DefaultCharLengthPChar;
    widestringmanager.CodePointLengthProc:=@DefaultCodePointLength;
  end;
  1909. {$endif FPC_HAS_BUILTIN_WIDESTR_MANAGER}
  {$ifndef FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
  {$define FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
  { Converts Str to a byte string in DefaultFileSystemCodePage using the
    Unicode2AnsiMoveProc hook of the installed widestring manager. }
  Function ToSingleByteFileSystemEncodedFileName(const Str: UnicodeString): RawByteString;
  var
    src : punicodechar;
    units : SizeInt;
  Begin
    src:=punicodechar(Str);
    units:=Length(Str);
    widestringmanager.Unicode2AnsiMoveProc(src,Result,DefaultFileSystemCodePage,units);
  End;
  {$endif FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODESTRING}
  {$ifndef FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
  {$define FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
  { Converts the text in arr to a byte string in DefaultFileSystemCodePage
    using the Unicode2AnsiMoveProc hook of the installed widestring manager.

    The text ends at the first #0 element or, when the array contains no #0,
    at the end of the array. The search for the terminator is bounded by
    Length(arr), so an array that is completely filled is never read past
    its last element. An empty array yields an empty string. }
  Function ToSingleByteFileSystemEncodedFileName(const arr: array of widechar): RawByteString;
  var
    units : SizeInt;
  Begin
    if Length(arr)=0 then
      begin
        { nothing to address: arr[0] does not exist }
        Result:='';
        exit;
      end;
    { IndexWord returns -1 when no terminator is found inside the array }
    units:=IndexWord(arr[0],Length(arr),0);
    if units<0 then
      units:=Length(arr);
    widestringmanager.Unicode2AnsiMoveProc(@arr[0],Result,
      DefaultFileSystemCodePage,units);
  End;
  {$endif FPC_HAS_TOSINGLEBYTEFILESYSTEMENCODEDFILENAME_UNICODECHARARRAY}
  { Returns a copy of Str whose code page is set to DefaultFileSystemCodePage
    by SetCodePage with its third argument True. }
  Function ToSingleByteFileSystemEncodedFileName(const Str: RawByteString): RawByteString;
  const
    ConvertData = True;
  Begin
    Result:=Str;
    SetCodePage(Result,DefaultFileSystemCodePage,ConvertData);
  End;
  { Delphi compatibility: the bytes of S are always interpreted as UTF-8,
    whatever code page the string is tagged with. Forwards to UTF8Decode. }
  function UTF8ToString(const S: RawByteString): UnicodeString; inline;
  begin
    UTF8ToString:=UTF8Decode(S);
  end;
  { Decodes the bytes of s as UTF-8; forwards to UTF8Decode. }
  function UTF8ToUnicodeString(const s : RawByteString): UnicodeString;
  begin
    UTF8ToUnicodeString:=UTF8Decode(S);
  end;
  { Decodes a ShortString holding UTF-8: the value is first assigned to a
    RawByteString, which is then passed to UTF8Decode. }
  function UTF8ToString(const S: ShortString): UnicodeString;
  var
    bytes: RawByteString;
  begin
    bytes:=S;
    Result:=UTF8Decode(bytes);
  end;
  { Alias of the ShortString overload of UTF8ToString. }
  function UTF8ToUnicodeString(const S: ShortString): unicodestring;
  begin
    UTF8ToUnicodeString:=UTF8ToString(S);
  end;
  { Decodes a null-terminated UTF-8 string: length(S) bytes are copied into a
    temporary RawByteString, which is then decoded by the RawByteString
    overload. }
  function UTF8ToString(const S: PAnsiChar): UnicodeString;
  var
    bytes: RawByteString;
    n: SizeInt;
  begin
    n:=length(S);
    SetLength(bytes,n);
    if n>0 then
      fpc_pchar_ansistr_intern_charmove(S,0,bytes,0,n);
    Result:=UTF8ToString(bytes);
  end;
  { Alias of the PAnsiChar overload of UTF8ToString. }
  function UTF8ToUnicodeString(const S: PAnsiChar): unicodestring;
  begin
    UTF8ToUnicodeString:=UTF8ToString(S);
  end;
  1967. { byte and ansichar are the same on the JVM, and "array of" and "pointer to"
  1968. are as well }
  1969. {$ifndef CPUJVM}
  { Decodes an array of UTF-8 bytes given as AnsiChar: all Length(S) elements
    are copied into a temporary RawByteString, which is then decoded by the
    RawByteString overload. }
  function UTF8ToString(const S: array of AnsiChar): UnicodeString;
  var
    bytes: RawByteString;
    n: SizeInt;
  begin
    n:=Length(S);
    SetLength(bytes,n);
    if n>0 then
      fpc_pchar_ansistr_intern_charmove(@S,Low(S),bytes,0,n);
    Result:=UTF8ToString(bytes);
  end;
  { Decodes an array of UTF-8 bytes: all Length(S) elements are copied into a
    temporary RawByteString, which is then decoded by the RawByteString
    overload. }
  function UTF8ToString(const S: array of Byte): UnicodeString;
  var
    bytes: RawByteString;
    n: SizeInt;
  begin
    n:=Length(S);
    SetLength(bytes,n);
    if n>0 then
      fpc_pchar_ansistr_intern_charmove(pansichar(@S),Low(S),bytes,0,n);
    Result:=UTF8ToString(bytes);
  end;
  1992. {$endif not CPUJVM}
  { Maps a locale/encoding name to a code page.
    'UTF-8'/'UTF8' give CP_UTF8 and 'UTF-7'/'UTF7' give CP_UTF7 (exact,
    case-sensitive match). Any other name is passed to
    LocaleNameToCodePageCallBack when one is assigned; the callback receives
    Result preset to True and may change it. Without a callback the function
    returns False and codepage is not assigned. }
  Function LocaleNameToCodePage(const localename : shortstring; out codepage : TSystemCodePage) : Boolean;
  begin
    if (localename='UTF-8') or (localename='UTF8') then
      begin
        CodePage:=CP_UTF8;
        exit(True);
      end;
    if (localename='UTF-7') or (localename='UTF7') then
      begin
        CodePage:=CP_UTF7;
        exit(True);
      end;
    Result:=Assigned(LocaleNameToCodePageCallBack);
    if Result then
      LocaleNameToCodePageCallBack(LocaleName,CodePage,Result);
  end;