winiconv.inc 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408
  1. { source: http://win-iconv.googlecode.com/svn-history/r6/trunk/win_iconv.c
  2. public domain
  3. }
  4. type
  5. twin2iconv = record
  6. cp: word;
  7. name: rawbytestring; { for null-termination }
  8. end;
  9. (*
  10. * Code Page Identifiers
  11. * http://msdn2.microsoft.com/en-us/library/ms776446.aspx
  12. *)
  13. const
  14. win2iconv_arr: array[0..319] of twin2iconv =
  15. ((cp:37; name:'IBM037'), (* IBM EBCDIC US-Canada *)
  16. (cp:154; name:'CP154'),
  17. (cp:154; name:'CYRILLIC-ASIAN'),
  18. (cp:154; name:'PT154'),
  19. (cp:154; name:'PTCP154'),
  20. (cp:154; name:'CSPTCP154'),
  21. (cp:437; name:'437'),
  22. (cp:437; name:'CP437'),
  23. (cp:437; name:'IBM437'),
  24. (cp:437; name:'CSPC8CODEPAGE437'),
  25. (cp:437; name:'IBM437'), (* OEM United States *)
  26. (cp:500; name:'IBM500'), (* IBM EBCDIC International *)
  27. (cp:708; name:'ASMO-708'), (* Arabic (ASMO 708) *)
  28. (cp:720; name:'DOS-720'), (* Arabic (Transparent ASMO); Arabic (DOS) *)
  29. (cp:737; name:'CP737'),
  30. (cp:737; name:'ibm737'), (* OEM Greek (formerly 437G); Greek (DOS) *)
  31. (cp:775; name:'CP775'),
  32. (cp:775; name:'IBM775'),
  33. (cp:775; name:'CSPC775BALTIC'),
  34. (cp:775; name:'ibm775'), (* OEM Baltic; Baltic (DOS) *)
  35. (cp:850; name:'850'),
  36. (cp:850; name:'CP850'),
  37. (cp:850; name:'IBM850'),
  38. (cp:850; name:'CSPC850MULTILINGUAL'),
  39. (cp:850; name:'ibm850'), (* OEM Multilingual Latin 1; Western European (DOS) *)
  40. (cp:852; name:'852'),
  41. (cp:852; name:'CP852'),
  42. (cp:852; name:'IBM852'),
  43. (cp:852; name:'CSPCP852'),
  44. (cp:852; name:'ibm852'), (* OEM Latin 2; Central European (DOS) *)
  45. (cp:853; name:'CP853'),
  46. (cp:855; name:'855'),
  47. (cp:855; name:'CP855'),
  48. (cp:855; name:'IBM855'),
  49. (cp:855; name:'CSIBM855'),
  50. (cp:855; name:'IBM855'), (* OEM Cyrillic (primarily Russian) *)
  51. (cp:857; name:'857'),
  52. (cp:857; name:'CP857'),
  53. (cp:857; name:'IBM857'),
  54. (cp:857; name:'CSIBM857'),
  55. (cp:857; name:'ibm857'), (* OEM Turkish; Turkish (DOS) *)
  56. (cp:858; name:'CP858'),
  57. (cp:858; name:'IBM00858'), (* OEM Multilingual Latin 1 + Euro symbol *)
  58. (cp:860; name:'860'),
  59. (cp:860; name:'CP860'),
  60. (cp:860; name:'IBM860'),
  61. (cp:860; name:'CSIBM860'),
  62. (cp:860; name:'IBM860'), (* OEM Portuguese; Portuguese (DOS) *)
  63. (cp:861; name:'861'),
  64. (cp:861; name:'CP-IS'),
  65. (cp:861; name:'CP861'),
  66. (cp:861; name:'IBM861'),
  67. (cp:861; name:'CSIBM861'),
  68. (cp:861; name:'ibm861'), (* OEM Icelandic; Icelandic (DOS) *)
  69. (cp:862; name:'862'),
  70. (cp:862; name:'CP862'),
  71. (cp:862; name:'IBM862'),
  72. (cp:862; name:'CSPC862LATINHEBREW'),
  73. (cp:862; name:'DOS-862'), (* OEM Hebrew; Hebrew (DOS) *)
  74. (cp:863; name:'863'),
  75. (cp:863; name:'CP863'),
  76. (cp:863; name:'IBM863'),
  77. (cp:863; name:'CSIBM863'),
  78. (cp:863; name:'IBM863'), (* OEM French Canadian; French Canadian (DOS) *)
  79. (cp:864; name:'CP864'),
  80. (cp:864; name:'IBM864'),
  81. (cp:864; name:'CSIBM864'),
  82. (cp:864; name:'IBM864'), (* OEM Arabic; Arabic (864) *)
  83. (cp:865; name:'865'),
  84. (cp:865; name:'CP865'),
  85. (cp:865; name:'IBM865'),
  86. (cp:865; name:'CSIBM865'),
  87. (cp:865; name:'IBM865'), (* OEM Nordic; Nordic (DOS) *)
  88. (cp:866; name:'866'),
  89. (cp:866; name:'CP866'),
  90. (cp:866; name:'IBM866'),
  91. (cp:866; name:'CSIBM866'),
  92. (cp:866; name:'cp866'), (* OEM Russian; Cyrillic (DOS) *)
  93. (cp:869; name:'869'),
  94. (cp:869; name:'CP-GR'),
  95. (cp:869; name:'CP869'),
  96. (cp:869; name:'IBM869'),
  97. (cp:869; name:'CSIBM869'),
  98. (cp:869; name:'ibm869'), (* OEM Modern Greek; Greek, Modern (DOS) *)
  99. (cp:870; name:'IBM870'), (* IBM EBCDIC Multilingual/ROECE (Latin 2); IBM EBCDIC Multilingual Latin 2 *)
  100. (cp:874; name:'CP874'),
  101. (cp:874; name:'WINDOWS-874'),
  102. (cp:874; name:'windows-874'), (* ANSI/OEM Thai (same as 28605, ISO 8859-15); Thai (Windows) *)
  103. (cp:875; name:'cp875'), (* IBM EBCDIC Greek Modern *)
  104. (cp:932; name:'CP932'),
  105. (cp:932; name:'MS932'),
  106. (cp:932; name:'SHIFFT_JIS'),
  107. (cp:932; name:'SHIFFT_JIS-MS'),
  108. (cp:932; name:'SJIS'),
  109. (cp:932; name:'SJIS-MS'),
  110. (cp:932; name:'SJIS-OPEN'),
  111. (cp:932; name:'SJIS-WIN'),
  112. (cp:932; name:'WINDOWS-31J'),
  113. (cp:932; name:'WINDOWS-932'),
  114. (cp:932; name:'CSWINDOWS31J'),
  115. (cp:932; name:'shift_jis'), (* ANSI/OEM Japanese; Japanese (Shift-JIS) *)
  116. (cp:932; name:'shift-jis'), (* alternative name for it *)
  117. (cp:936; name:'CP936'),
  118. (cp:936; name:'GBK'),
  119. (cp:936; name:'MS936'),
  120. (cp:936; name:'WINDOWS-936'),
  121. (cp:936; name:'gb2312'), (* ANSI/OEM Simplified Chinese (PRC, Singapore); Chinese Simplified (GB2312) *)
  122. (cp:949; name:'CP949'),
  123. (cp:949; name:'UHC'),
  124. (cp:949; name:'EUC-KR'),
  125. (cp:949; name:'ks_c_5601-1987'), (* ANSI/OEM Korean (Unified Hangul Code) *)
  126. (cp:950; name:'CP950'),
  127. (cp:950; name:'BIG5'),
  128. (cp:950; name:'big5'), (* ANSI/OEM Traditional Chinese (Taiwan; Hong Kong SAR, PRC); Chinese Traditional (Big5) *)
  129. (cp:1026; name:'IBM1026'), (* IBM EBCDIC Turkish (Latin 5) *)
  130. (cp:1047; name:'IBM01047'), (* IBM EBCDIC Latin 1/Open System *)
  131. (cp:1125; name:'CP1125'),
  132. (cp:1133; name:'CP1133'),
  133. (cp:1133; name:'IBM-CP1133'),
  134. (cp:1140; name:'IBM01140'), (* IBM EBCDIC US-Canada (037 + Euro symbol); IBM EBCDIC (US-Canada-Euro) *)
  135. (cp:1141; name:'IBM01141'), (* IBM EBCDIC Germany (20273 + Euro symbol); IBM EBCDIC (Germany-Euro) *)
  136. (cp:1142; name:'IBM01142'), (* IBM EBCDIC Denmark-Norway (20277 + Euro symbol); IBM EBCDIC (Denmark-Norway-Euro) *)
  137. (cp:1143; name:'IBM01143'), (* IBM EBCDIC Finland-Sweden (20278 + Euro symbol); IBM EBCDIC (Finland-Sweden-Euro) *)
  138. (cp:1144; name:'IBM01144'), (* IBM EBCDIC Italy (20280 + Euro symbol); IBM EBCDIC (Italy-Euro) *)
  139. (cp:1145; name:'IBM01145'), (* IBM EBCDIC Latin America-Spain (20284 + Euro symbol); IBM EBCDIC (Spain-Euro) *)
  140. (cp:1146; name:'IBM01146'), (* IBM EBCDIC United Kingdom (20285 + Euro symbol); IBM EBCDIC (UK-Euro) *)
  141. (cp:1147; name:'IBM01147'), (* IBM EBCDIC France (20297 + Euro symbol); IBM EBCDIC (France-Euro) *)
  142. (cp:1148; name:'IBM01148'), (* IBM EBCDIC International (500 + Euro symbol); IBM EBCDIC (International-Euro) *)
  143. (cp:1149; name:'IBM01149'), (* IBM EBCDIC Icelandic (20871 + Euro symbol); IBM EBCDIC (Icelandic-Euro) *)
  144. (cp:1200; name:'UTF-16LE'),
  145. (cp:1200; name:'UTF16LE'),
  146. (cp:1200; name:'UCS-2LE'),
  147. (cp:1200; name:'CP1200'),
  148. {$ifdef FPC_LITTLE_ENDIAN}
  149. (* Default is little endian, because the platform is *)
  150. (cp:1200; name:'UTF16'),
  151. (cp:1200; name:'UTF-16'),
  152. (cp:1200; name:'UCS-2'),
  153. {$endif}
  154. (cp:1201; name:'UTF-16BE'),
  155. (cp:1201; name:'UTF16BE'),
  156. (cp:1201; name:'UCS-2BE'),
  157. (cp:1201; name:'unicodeFFFE'),
  158. (cp:1201; name:'CP1201'),
  159. {$ifdef FPC_BIG_ENDIAN}
  160. (*
  161. * Default is big endian.
  162. * See rfc2781 4.3 Interpreting text labelled as UTF-16.
  163. *)
  164. (cp:1201; name:'UTF16'),
  165. (cp:1201; name:'UTF-16'),
  166. (cp:1201; name:'UCS-2'),
  167. {$endif}
  168. (cp:1250; name:'CP1250'),
  169. (cp:1250; name:'MS-EE'),
  170. (cp:1250; name:'WINDOWS-1250'),
  171. (cp:1250; name:'windows-1250'), (* ANSI Central European; Central European (Windows) *)
  172. (cp:1251; name:'CP1251'),
  173. (cp:1251; name:'MS-CYRL'),
  174. (cp:1251; name:'WINDOWS-1251'),
  175. (cp:1251; name:'windows-1251'), (* ANSI Cyrillic; Cyrillic (Windows) *)
  176. (cp:1252; name:'CP819'),
  177. (cp:1252; name:'IBM819'),
  178. (cp:1252; name:'CP1252'),
  179. (cp:1252; name:'MS-ANSI'),
  180. (cp:1252; name:'WINDOWS-1252'),
  181. (cp:1252; name:'windows-1252'), (* ANSI Latin 1; Western European (Windows) *)
  182. (cp:1253; name:'CP1253'),
  183. (cp:1253; name:'MS-GREEK'),
  184. (cp:1253; name:'WINDOWS-1253'),
  185. (cp:1253; name:'windows-1253'), (* ANSI Greek; Greek (Windows) *)
  186. (cp:1254; name:'CP1254'),
  187. (cp:1254; name:'MS-TURK'),
  188. (cp:1254; name:'WINDOWS-1254'),
  189. (cp:1254; name:'windows-1254'), (* ANSI Turkish; Turkish (Windows) *)
  190. (cp:1255; name:'CP1255'),
  191. (cp:1255; name:'MS-HEBR'),
  192. (cp:1255; name:'WINDOWS-1255'),
  193. (cp:1255; name:'windows-1255'), (* ANSI Hebrew; Hebrew (Windows) *)
  194. (cp:1256; name:'CP1256'),
  195. (cp:1256; name:'MS-ARAB'),
  196. (cp:1256; name:'WINDOWS-1256'),
  197. (cp:1256; name:'windows-1256'), (* ANSI Arabic; Arabic (Windows) *)
  198. (cp:1257; name:'CP1257'),
  199. (cp:1257; name:'WINBALTRIM'),
  200. (cp:1257; name:'WINDOWS-1257'),
  201. (cp:1257; name:'windows-1257'), (* ANSI Baltic; Baltic (Windows) *)
  202. (cp:1258; name:'CP1258'),
  203. (cp:1258; name:'WINDOWS-1258'),
  204. (cp:1258; name:'windows-1258'), (* ANSI/OEM Vietnamese; Vietnamese (Windows) *)
  205. (cp:1361; name:'CP1361'),
  206. (cp:1361; name:'JOHAB'),
  207. (cp:1361; name:'Johab'), (* Korean (Johab) *)
  208. (cp:10000; name:'macintosh'), (* MAC Roman; Western European (Mac) *)
  209. (cp:10001; name:'x-mac-japanese'), (* Japanese (Mac) *)
  210. (cp:10002; name:'x-mac-chinesetrad'), (* MAC Traditional Chinese (Big5); Chinese Traditional (Mac) *)
  211. (cp:10003; name:'x-mac-korean'), (* Korean (Mac) *)
  212. (cp:10004; name:'x-mac-arabic'), (* Arabic (Mac) *)
  213. (cp:10005; name:'x-mac-hebrew'), (* Hebrew (Mac) *)
  214. (cp:10006; name:'x-mac-greek'), (* Greek (Mac) *)
  215. (cp:10007; name:'x-mac-cyrillic'), (* Cyrillic (Mac) *)
  216. (cp:10008; name:'x-mac-chinesesimp'), (* MAC Simplified Chinese (GB 2312); Chinese Simplified (Mac) *)
  217. (cp:10010; name:'x-mac-romanian'), (* Romanian (Mac) *)
  218. (cp:10017; name:'x-mac-ukrainian'), (* Ukrainian (Mac) *)
  219. (cp:10021; name:'x-mac-thai'), (* Thai (Mac) *)
  220. (cp:10029; name:'x-mac-ce'), (* MAC Latin 2; Central European (Mac) *)
  221. (cp:10079; name:'x-mac-icelandic'), (* Icelandic (Mac) *)
  222. (cp:10081; name:'x-mac-turkish'), (* Turkish (Mac) *)
  223. (cp:10082; name:'x-mac-croatian'), (* Croatian (Mac) *)
  224. (cp:12000; name:'UTF-32LE'),
  225. (cp:12000; name:'CP12000'),
  226. (cp:12000; name:'UTF32LE'),
  227. {$ifdef FPC_LITTLE_ENDIAN}
  228. (cp:12000; name:'UTF32'),
  229. (cp:12000; name:'UTF-32'),
  230. {$endif}
  231. (cp:12001; name:'UTF-32BE'),
  232. (cp:12001; name:'CP12001'),
  233. (cp:12001; name:'UTF32BE'),
  234. {$ifdef FPC_BIG_ENDIAN}
  235. (cp:12001; name:'UTF32'),
  236. (cp:12001; name:'UTF-32'),
  237. {$endif}
  238. (cp:20000; name:'x-Chinese_CNS'), (* CNS Taiwan; Chinese Traditional (CNS) *)
  239. (cp:20001; name:'x-cp20001'), (* TCA Taiwan *)
  240. (cp:20002; name:'x_Chinese-Eten'), (* Eten Taiwan; Chinese Traditional (Eten) *)
  241. (cp:20003; name:'x-cp20003'), (* IBM5550 Taiwan *)
  242. (cp:20004; name:'x-cp20004'), (* TeleText Taiwan *)
  243. (cp:20005; name:'x-cp20005'), (* Wang Taiwan *)
  244. (cp:20105; name:'x-IA5'), (* IA5 (IRV International Alphabet No. 5, 7-bit); Western European (IA5) *)
  245. (cp:20106; name:'x-IA5-German'), (* IA5 German (7-bit) *)
  246. (cp:20107; name:'x-IA5-Swedish'), (* IA5 Swedish (7-bit) *)
  247. (cp:20108; name:'x-IA5-Norwegian'), (* IA5 Norwegian (7-bit) *)
  248. (cp:20127; name:'US-ASCII'),
  249. (cp:20127; name:'ASCII'),
  250. (cp:20127; name:'ANSI_X3.4-1968'),
  251. (cp:20127; name:'ANSI_X3.4-1986'),
  252. (cp:20127; name:'CP367'),
  253. (cp:20127; name:'IBM367'),
  254. (cp:20127; name:'ISO-IR-6'),
  255. (cp:20127; name:'ISO646-US'),
  256. (cp:20127; name:'ISO_646.IRV:1991'),
  257. (cp:20127; name:'US'),
  258. (cp:20127; name:'CSASCII'),
  259. (cp:20127; name:'us-ascii'), (* US-ASCII (7-bit) *)
  260. (cp:20261; name:'x-cp20261'), (* T.61 *)
  261. (cp:20269; name:'x-cp20269'), (* ISO 6937 Non-Spacing Accent *)
  262. (cp:20273; name:'IBM273'), (* IBM EBCDIC Germany *)
  263. (cp:20277; name:'IBM277'), (* IBM EBCDIC Denmark-Norway *)
  264. (cp:20278; name:'IBM278'), (* IBM EBCDIC Finland-Sweden *)
  265. (cp:20280; name:'IBM280'), (* IBM EBCDIC Italy *)
  266. (cp:20284; name:'IBM284'), (* IBM EBCDIC Latin America-Spain *)
  267. (cp:20285; name:'IBM285'), (* IBM EBCDIC United Kingdom *)
  268. (cp:20290; name:'IBM290'), (* IBM EBCDIC Japanese Katakana Extended *)
  269. (cp:20297; name:'IBM297'), (* IBM EBCDIC France *)
  270. (cp:20420; name:'IBM420'), (* IBM EBCDIC Arabic *)
  271. (cp:20423; name:'IBM423'), (* IBM EBCDIC Greek *)
  272. (cp:20424; name:'IBM424'), (* IBM EBCDIC Hebrew *)
  273. (cp:20833; name:'x-EBCDIC-KoreanExtended'), (* IBM EBCDIC Korean Extended *)
  274. (cp:20838; name:'IBM-Thai'), (* IBM EBCDIC Thai *)
  275. (cp:20866; name:'koi8-r'), (* Russian (KOI8-R); Cyrillic (KOI8-R) *)
  276. (cp:20871; name:'IBM871'), (* IBM EBCDIC Icelandic *)
  277. (cp:20880; name:'IBM880'), (* IBM EBCDIC Cyrillic Russian *)
  278. (cp:20905; name:'IBM905'), (* IBM EBCDIC Turkish *)
  279. (cp:20924; name:'IBM00924'), (* IBM EBCDIC Latin 1/Open System (1047 + Euro symbol) *)
  280. (cp:20932; name:'EUC-JP'), (* Japanese (JIS 0208-1990 and 0121-1990) *)
  281. (cp:20936; name:'x-cp20936'), (* Simplified Chinese (GB2312); Chinese Simplified (GB2312-80) *)
  282. (cp:20949; name:'x-cp20949'), (* Korean Wansung *)
  283. (cp:21025; name:'cp1025'), (* IBM EBCDIC Cyrillic Serbian-Bulgarian *)
  284. (cp:21866; name:'koi8-u'), (* Ukrainian (KOI8-U); Cyrillic (KOI8-U) *)
  285. (cp:28591; name:'ISO-8859-1'),
  286. (cp:28591; name:'ISO-IR-100'),
  287. (cp:28591; name:'ISO8859-1'),
  288. (cp:28591; name:'ISO_8859-1'),
  289. (cp:28591; name:'ISO_8859-1:1987'),
  290. (cp:28591; name:'L1'),
  291. (cp:28591; name:'LATIN1'),
  292. (cp:28591; name:'CSISOLATIN1'),
  293. (cp:28591; name:'iso-8859-1'), (* ISO 8859-1 Latin 1; Western European (ISO) *)
  294. (cp:28591; name:'iso8859-1'), (* ISO 8859-1 Latin 1; Western European (ISO) *)
  295. (cp:28592; name:'iso-8859-2'), (* ISO 8859-2 Central European; Central European (ISO) *)
  296. (cp:28592; name:'iso8859-2'), (* ISO 8859-2 Central European; Central European (ISO) *)
  297. (cp:28593; name:'iso-8859-3'), (* ISO 8859-3 Latin 3 *)
  298. (cp:28593; name:'iso8859-3'), (* ISO 8859-3 Latin 3 *)
  299. (cp:28594; name:'iso-8859-4'), (* ISO 8859-4 Baltic *)
  300. (cp:28594; name:'iso8859-4'), (* ISO 8859-4 Baltic *)
  301. (cp:28595; name:'iso-8859-5'), (* ISO 8859-5 Cyrillic *)
  302. (cp:28595; name:'iso8859-5'), (* ISO 8859-5 Cyrillic *)
  303. (cp:28596; name:'iso-8859-6'), (* ISO 8859-6 Arabic *)
  304. (cp:28596; name:'iso8859-6'), (* ISO 8859-6 Arabic *)
  305. (cp:28597; name:'iso-8859-7'), (* ISO 8859-7 Greek *)
  306. (cp:28597; name:'iso8859-7'), (* ISO 8859-7 Greek *)
  307. (cp:28598; name:'iso-8859-8'), (* ISO 8859-8 Hebrew; Hebrew (ISO-Visual) *)
  308. (cp:28598; name:'iso8859-8'), (* ISO 8859-8 Hebrew; Hebrew (ISO-Visual) *)
  309. (cp:28599; name:'iso-8859-9'), (* ISO 8859-9 Turkish *)
  310. (cp:28599; name:'iso8859-9'), (* ISO 8859-9 Turkish *)
  311. (cp:28603; name:'iso-8859-13'), (* ISO 8859-13 Estonian *)
  312. (cp:28603; name:'iso8859-13'), (* ISO 8859-13 Estonian *)
  313. (cp:28605; name:'iso-8859-15'), (* ISO 8859-15 Latin 9 *)
  314. (cp:28605; name:'iso8859-15'), (* ISO 8859-15 Latin 9 *)
  315. (cp:29001; name:'x-Europa'), (* Europa 3 *)
  316. (cp:38598; name:'iso-8859-8-i'), (* ISO 8859-8 Hebrew; Hebrew (ISO-Logical) *)
  317. (cp:38598; name:'iso8859-8-i'), (* ISO 8859-8 Hebrew; Hebrew (ISO-Logical) *)
  318. (cp:50220; name:'iso-2022-jp'), (* ISO 2022 Japanese with no halfwidth Katakana; Japanese (JIS) *)
  319. (cp:50221; name:'ISO-2022-JP'),
  320. (cp:50221; name:'CP50221'),
  321. (cp:50221; name:'ISO-2022-JP-MS'),
  322. (cp:50221; name:'ISO2022-JP'),
  323. (cp:50221; name:'ISO2022-JP-MS'),
  324. (cp:50221; name:'MS50221'),
  325. (cp:50221; name:'WINDOWS-50221'),
  326. (cp:50221; name:'csISO2022JP'), (* ISO 2022 Japanese with halfwidth Katakana; Japanese (JIS-Allow 1 byte Kana) *)
  327. (cp:50222; name:'iso-2022-jp'), (* ISO 2022 Japanese JIS X 0201-1989; Japanese (JIS-Allow 1 byte Kana - SO/SI) *)
  328. (cp:50225; name:'iso-2022-kr'), (* ISO 2022 Korean *)
  329. (cp:50225; name:'iso2022-kr'), (* ISO 2022 Korean *)
  330. (cp:50227; name:'x-cp50227'), (* ISO 2022 Simplified Chinese; Chinese Simplified (ISO 2022) *)
  331. (cp:51932; name:'EUC-JP'),
  332. (cp:51932; name:'CP51932'),
  333. (cp:51932; name:'MS51932'),
  334. (cp:51932; name:'WINDOWS-51932'),
  335. (cp:51932; name:'euc-jp'), (* EUC Japanese *)
  336. (cp:51936; name:'EUC-CN'), (* EUC Simplified Chinese; Chinese Simplified (EUC) *)
  337. (cp:51949; name:'euc-kr'), (* EUC Korean *)
  338. (cp:52936; name:'hz-gb-2312'), (* HZ-GB2312 Simplified Chinese; Chinese Simplified (HZ) *)
  339. (cp:54936; name:'GB18030'), (* Windows XP and later: GB18030 Simplified Chinese (4 byte); Chinese Simplified (GB18030) *)
  340. (cp:57002; name:'x-iscii-de'), (* ISCII Devanagari *)
  341. (cp:57003; name:'x-iscii-be'), (* ISCII Bengali *)
  342. (cp:57004; name:'x-iscii-ta'), (* ISCII Tamil *)
  343. (cp:57005; name:'x-iscii-te'), (* ISCII Telugu *)
  344. (cp:57006; name:'x-iscii-as'), (* ISCII Assamese *)
  345. (cp:57007; name:'x-iscii-or'), (* ISCII Oriya *)
  346. (cp:57008; name:'x-iscii-ka'), (* ISCII Kannada *)
  347. (cp:57009; name:'x-iscii-ma'), (* ISCII Malayalam *)
  348. (cp:57010; name:'x-iscii-gu'), (* ISCII Gujarati *)
  349. (cp:57011; name:'x-iscii-pa'), (* ISCII Punjabi *)
  350. (cp:65001; name:'UTF-8'),
  351. (cp:65001; name:'CP65001'),
  352. (cp:65001; name:'UTF8'));
  353. function win2iconv(cp: word): rawbytestring;
  354. var
  355. l, h, i, ccp: longint;
  356. begin
  357. l:=low(win2iconv_arr);
  358. h:=high(win2iconv_arr);
  359. repeat
  360. i:=(l+h+1) shr 1;
  361. ccp:=win2iconv_arr[i].cp;
  362. if cp=ccp then
  363. break;
  364. if cp>=ccp then
  365. l:=i
  366. else
  367. h:=i-1;
  368. until l>=h;
  369. if cp=win2iconv_arr[i].cp then
  370. begin
  371. { the array has been ordered so that in case multiple alias names
  372. exist, the first entry for the cp is the most commonly supported
  373. one
  374. }
  375. while (i>low(win2iconv_arr)) and
  376. (win2iconv_arr[i-1].cp=cp) do
  377. dec(i);
  378. result:=win2iconv_arr[i].name;
  379. end
  380. else
  381. { or better raise an error? }
  382. result:='<unsupported>';
  383. end;
  384. function iconv2win(cpname: rawbytestring): word;
  385. var
  386. i: longint;
  387. begin
  388. { clear encoding to prevent nonsense code page conversion of the input
  389. ansistring (encoding names are always ascii) }
  390. SetCodePage(cpname,$ffff,false);
  391. { simple linear scan, not a common operation and hence not worth
  392. building a separate array for }
  393. for i:=low(win2iconv_arr) to high(win2iconv_arr) do
  394. if win2iconv_arr[i].name=cpname then
  395. begin
  396. result:=win2iconv_arr[i].cp;
  397. exit;
  398. end;
  399. { rawbytestring (or better raise an error?) }
  400. result:=65535;
  401. end;