cwstring.pp 6.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270
  1. {
  2. This file is part of the Free Pascal run time library.
  3. Copyright (c) 2005 by Florian Klaempfl,
  4. member of the Free Pascal development team.
  5. libc based wide string support
  6. See the file COPYING.FPC, included in this distribution,
  7. for details about the copyright.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  11. **********************************************************************}
  12. {$mode objfpc}
  13. unit cwstring;
  14. interface
  15. procedure SetCWidestringManager;
  16. implementation
  17. {$linklib c}
  18. {$ifdef bsd}
  19. {$linklib iconv}
  20. {$endif bsd}
  21. Uses
  22. BaseUnix,
  23. ctypes,
  24. unix,
  25. unixtype,
  26. sysutils,
  27. initc;
  28. Const
  29. libiconvname='iconv';
  30. { Case-mapping "arrays" }
  31. var
  32. AnsiUpperChars: AnsiString; // 1..255
  33. AnsiLowerChars: AnsiString; // 1..255
  34. WideUpperChars: WideString; // 1..65535
  35. WideLowerChars: WideString; // 1..65535
  36. { the following declarations are from the libc unit for linux so they
  37. might be very linux centric
  38. maybe this needs to be splitted in an os depend way later }
  39. function towlower(__wc:wint_t):wint_t;cdecl;external;
  40. function towupper(__wc:wint_t):wint_t;cdecl;external;
  41. function wcscoll(__s1:pwchar_t; __s2:pwchar_t):longint;cdecl;external;
  42. const
  43. {$ifdef linux}
  44. __LC_CTYPE = 0;
  45. _NL_CTYPE_CLASS = (__LC_CTYPE shl 16);
  46. _NL_CTYPE_CODESET_NAME = (_NL_CTYPE_CLASS)+14;
  47. CODESET = _NL_CTYPE_CODESET_NAME;
  48. {$else linux}
  49. {$ifdef darwin}
  50. CODESET = 0;
  51. {$else darwin}
  52. {$ifdef FreeBSD} // actually FreeBSD5. internationalisation is afaik not default on 4.
  53. CODESET = 0;
  54. {$else freebsd}
  55. {$error lookup the value of CODESET in /usr/include/langinfo.h for your OS }
  56. {$endif FreeNSD}
  57. {$endif darwin}
  58. {$endif linux}
  59. { unicode encoding name }
  60. {$ifdef FPC_LITTLE_ENDIAN}
  61. unicode_encoding = 'UNICODELITTLE';
  62. {$else FPC_LITTLE_ENDIAN}
  63. unicode_encoding = 'UNICODEBIG';
  64. {$endif FPC_LITTLE_ENDIAN}
  65. type
  66. piconv_t = ^iconv_t;
  67. iconv_t = pointer;
  68. nl_item = longint;
  69. function nl_langinfo(__item:nl_item):pchar;cdecl;external libiconvname name 'nl_langinfo';
  70. {$ifndef Darwin}
  71. function iconv_open(__tocode:pchar; __fromcode:pchar):iconv_t;cdecl;external libiconvname name 'iconv_open';
  72. function iconv(__cd:iconv_t; __inbuf:ppchar; __inbytesleft:psize_t; __outbuf:ppchar; __outbytesleft:psize_t):size_t;cdecl;external libiconvname name 'iconv';
  73. function iconv_close(__cd:iconv_t):longint;cdecl;external libiconvname name 'iconv_close';
  74. {$else}
  75. function iconv_open(__tocode:pchar; __fromcode:pchar):iconv_t;cdecl;external libiconvname name 'libiconv_open';
  76. function iconv(__cd:iconv_t; __inbuf:ppchar; __inbytesleft:psize_t; __outbuf:ppchar; __outbytesleft:psize_t):size_t;cdecl;external libiconvname name 'libiconv';
  77. function iconv_close(__cd:iconv_t):longint;cdecl;external libiconvname name 'libiconv_close';
  78. {$endif}
  79. var
  80. iconv_ansi2wide,
  81. iconv_wide2ansi : iconv_t;
  82. procedure Wide2AnsiMove(source:pwidechar;var dest:ansistring;len:SizeInt);
  83. var
  84. outlength,
  85. outoffset,
  86. srclen,
  87. outleft : size_t;
  88. srcpos : pwidechar;
  89. destpos: pchar;
  90. mynil : pchar;
  91. my0 : size_t;
  92. begin
  93. mynil:=nil;
  94. my0:=0;
  95. { rought estimation }
  96. setlength(dest,len*3);
  97. outlength:=len*3;
  98. srclen:=len*2;
  99. srcpos:=source;
  100. destpos:=pchar(dest);
  101. outleft:=outlength;
  102. while iconv(iconv_wide2ansi,@srcpos,@srclen,@destpos,@outleft)=size_t(-1) do
  103. begin
  104. case fpgetCerrno of
  105. ESysEILSEQ:
  106. begin
  107. { skip and set to '?' }
  108. inc(srcpos);
  109. dec(srclen,2);
  110. destpos^:='?';
  111. inc(destpos);
  112. dec(outleft);
  113. { reset }
  114. iconv(iconv_wide2ansi,@mynil,@my0,@mynil,@my0);
  115. end;
  116. ESysE2BIG:
  117. begin
  118. outoffset:=destpos-pchar(dest);
  119. { extend }
  120. setlength(dest,outlength+len*3);
  121. inc(outleft,len*3);
  122. inc(outlength,len*3);
  123. { string could have been moved }
  124. destpos:=pchar(dest)+outoffset;
  125. end;
  126. else
  127. raise EConvertError.Create('iconv error');
  128. end;
  129. end;
  130. // truncate string
  131. setlength(dest,length(dest)-outleft);
  132. end;
  133. procedure Ansi2WideMove(source:pchar;var dest:widestring;len:SizeInt);
  134. var
  135. outlength,
  136. outoffset,
  137. outleft : size_t;
  138. srcpos,
  139. destpos: pchar;
  140. mynil : pchar;
  141. my0 : size_t;
  142. begin
  143. mynil:=nil;
  144. my0:=0;
  145. // extra space
  146. outlength:=len+1;
  147. setlength(dest,outlength);
  148. outlength:=len+1;
  149. srcpos:=source;
  150. destpos:=pchar(dest);
  151. outleft:=outlength*2;
  152. while iconv(iconv_ansi2wide,@srcpos,@len,@destpos,@outleft)=size_t(-1) do
  153. begin
  154. case fpgetCerrno of
  155. ESysE2BIG:
  156. begin
  157. outoffset:=destpos-pchar(dest);
  158. { extend }
  159. setlength(dest,outlength+len);
  160. inc(outleft,len*2);
  161. inc(outlength,len);
  162. { string could have been moved }
  163. destpos:=pchar(dest)+outoffset;
  164. end;
  165. else
  166. raise EConvertError.Create('iconv error');
  167. end;
  168. end;
  169. // truncate string
  170. setlength(dest,length(dest)-outleft div 2);
  171. end;
  172. function LowerWideString(const s : WideString) : WideString;
  173. var
  174. i : SizeInt;
  175. begin
  176. SetLength(result,length(s));
  177. for i:=1 to length(s) do
  178. result[i]:=WideChar(towlower(wint_t(s[i])));
  179. end;
  180. function UpperWideString(const s : WideString) : WideString;
  181. var
  182. i : SizeInt;
  183. begin
  184. SetLength(result,length(s));
  185. for i:=1 to length(s) do
  186. result[i]:=WideChar(towupper(wint_t(s[i])));
  187. end;
  188. function CompareWideString(const s1, s2 : WideString) : PtrInt;
  189. begin
  190. end;
  191. function CompareTextWideString(const s1, s2 : WideString): PtrInt;
  192. begin
  193. end;
  194. Var
  195. CWideStringManager : TWideStringManager;
  196. Procedure SetCWideStringManager;
  197. begin
  198. CWideStringManager:=widestringmanager;
  199. With CWideStringManager do
  200. begin
  201. Wide2AnsiMoveProc:=@Wide2AnsiMove;
  202. Ansi2WideMoveProc:=@Ansi2WideMove;
  203. UpperWideStringProc:=@UpperWideString;
  204. LowerWideStringProc:=@LowerWideString;
  205. {
  206. CompareWideStringProc
  207. CompareTextWideStringProc
  208. CharLengthPCharProc
  209. UpperAnsiStringProc
  210. LowerAnsiStringProc
  211. CompareStrAnsiStringProc
  212. CompareTextAnsiStringProc
  213. StrCompAnsiStringProc
  214. StrICompAnsiStringProc
  215. StrLCompAnsiStringProc
  216. StrLICompAnsiStringProc
  217. StrLowerAnsiStringProc
  218. StrUpperAnsiStringProc
  219. }
  220. end;
  221. SetWideStringManager(CWideStringManager);
  222. end;
  223. initialization
  224. SetCWideStringManager;
  225. { init conversion tables }
  226. iconv_wide2ansi:=iconv_open(nl_langinfo(CODESET),unicode_encoding);
  227. iconv_ansi2wide:=iconv_open(unicode_encoding,nl_langinfo(CODESET));
  228. finalization
  229. iconv_close(iconv_ansi2wide);
  230. end.