Utf8.hx 2.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788
  1. /*
  2. * Copyright (c) 2005, The haXe Project Contributors
  3. * All rights reserved.
  4. * Redistribution and use in source and binary forms, with or without
  5. * modification, are permitted provided that the following conditions are met:
  6. *
  7. * - Redistributions of source code must retain the above copyright
  8. * notice, this list of conditions and the following disclaimer.
  9. * - Redistributions in binary form must reproduce the above copyright
  10. * notice, this list of conditions and the following disclaimer in the
  11. * documentation and/or other materials provided with the distribution.
  12. *
  13. * THIS SOFTWARE IS PROVIDED BY THE HAXE PROJECT CONTRIBUTORS "AS IS" AND ANY
  14. * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  15. * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  16. * DISCLAIMED. IN NO EVENT SHALL THE HAXE PROJECT CONTRIBUTORS BE LIABLE FOR
  17. * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  18. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  19. * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  20. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  21. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  22. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
  23. * DAMAGE.
  24. */
  25. package haxe;
  26. @:core_api
  27. class Utf8 {
  28. var __b : String;
  29. public function new( ?size : Int ) : Void {
  30. __b = '';
  31. }
  32. public function addChar( c : Int ) : Void {
  33. __b += uchr(c);
  34. }
  35. public function toString() : String {
  36. return __b;
  37. }
  38. public static function encode( s : String ) : String {
  39. return untyped __call__("utf8_encode", s);
  40. }
  41. public static function decode( s : String ) : String {
  42. return untyped __call__("utf8_decode", s);
  43. }
  44. public static function iter(s : String, chars : Int -> Void ) : Void {
  45. var len = length(s);
  46. for(i in 0...len)
  47. chars(charCodeAt(s, i));
  48. }
  49. public static function charCodeAt( s : String, index : Int ) : Int {
  50. return uord(sub(s, index, 1));
  51. }
  52. static function uchr(i : Int) : String {
  53. return untyped __php__("mb_convert_encoding(pack('N',$i), 'UTF-8', 'UCS-4BE')");
  54. }
  55. static function uord(s : String) : Int untyped {
  56. var c : Array<Int> = untyped __php__("unpack('N', mb_convert_encoding($s, 'UCS-4BE', 'UTF-8'))");
  57. return c[1];
  58. }
  59. public static function validate( s : String ) : Bool {
  60. return untyped __call__("mb_check_encoding", s, enc);
  61. }
  62. public static function length( s : String ) : Int {
  63. return untyped __call__("mb_strlen", s, enc);
  64. }
  65. public static function compare( a : String, b : String ) : Int {
  66. return untyped __call__("strcmp", a, b);
  67. }
  68. public static function sub( s : String, pos : Int, len : Int ) : String {
  69. return untyped __call__("mb_substr", s, pos, len, enc);
  70. }
  71. private static inline var enc = "UTF-8";
  72. }