Utf8.hx 2.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687
  1. /*
  2. * Copyright (c) 2005, The haXe Project Contributors
  3. * All rights reserved.
  4. * Redistribution and use in source and binary forms, with or without
  5. * modification, are permitted provided that the following conditions are met:
  6. *
  7. * - Redistributions of source code must retain the above copyright
  8. * notice, this list of conditions and the following disclaimer.
  9. * - Redistributions in binary form must reproduce the above copyright
  10. * notice, this list of conditions and the following disclaimer in the
  11. * documentation and/or other materials provided with the distribution.
  12. *
  13. * THIS SOFTWARE IS PROVIDED BY THE HAXE PROJECT CONTRIBUTORS "AS IS" AND ANY
  14. * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  15. * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  16. * DISCLAIMED. IN NO EVENT SHALL THE HAXE PROJECT CONTRIBUTORS BE LIABLE FOR
  17. * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  18. * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
  19. * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  20. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  21. * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  22. * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH
  23. * DAMAGE.
  24. */
  25. package php;
  /**
  	UTF-8 string helpers for the PHP target, implemented on top of PHP's
  	`mbstring` functions.

  	An instance works as a small buffer: code points are appended with
  	`addChar` and the accumulated UTF-8 string is read back with `toString`.
  	The static functions operate on strings that are treated as UTF-8.
  **/
  class Utf8 {

  	/** Encoding name handed to every `mb_*` call made by this class. **/
  	private static inline var enc = "UTF-8";

  	/** Accumulated buffer content. **/
  	var __b : String;

  	/**
  		Creates an empty buffer.
  	**/
  	public function new() {
  		__b = '';
  	}

  	/**
  		Appends the character with code point `c` to the buffer.
  	**/
  	public function addChar( c : Int ) {
  		__b += uchr(c);
  	}

  	/**
  		Returns everything appended to the buffer so far.
  	**/
  	public function toString() : String {
  		return __b;
  	}

  	/**
  		Passes `s` through PHP's `utf8_encode` and returns the result.
  	**/
  	public static function encode( s : String ) : String {
  		return untyped __call__("utf8_encode", s);
  	}

  	/**
  		Passes `s` through PHP's `utf8_decode` and returns the result.
  	**/
  	public static function decode( s : String ) : String {
  		return untyped __call__("utf8_decode", s);
  	}

  	/**
  		Calls `chars` once per character of `s`, in order, with that
  		character's code point.
  	**/
  	public static function iter(s : String, chars : Int -> Void ) {
  		var len = length(s);
  		for(i in 0...len)
  			chars(charCodeAt(s, i));
  	}

  	/**
  		Returns the code point of the character at character position
  		`index` (not byte offset) of `s`.
  	**/
  	public static function charCodeAt( s : String, index : Int ) : Int {
  		return uord(sub(s, index, 1));
  	}

  	/**
  		Returns the UTF-8 string for the code point `i`.

  		The code point is packed as a big-endian 32-bit value ('N') and
  		converted from UCS-4BE. The target encoding is explicitly UTF-8 rather
  		than `mb_internal_encoding()`: `uord`, `length`, `sub` and `validate`
  		all assume UTF-8, so following the internal encoding would break the
  		`uord(uchr(c)) == c` round trip whenever PHP is configured otherwise.
  	**/
  	public static function uchr(i : Int) : String {
  		return untyped __php__("mb_convert_encoding(pack('N',$i), 'UTF-8', 'UCS-4BE')");
  	}

  	/**
  		Returns the code point of the first character of the UTF-8 string `s`.

  		The string is converted to UCS-4BE and its first four bytes are
  		unpacked as one big-endian 32-bit integer.
  	**/
  	public static function uord(s : String) : Int untyped {
  		var c : Array<Int> = untyped __php__("unpack('N', mb_convert_encoding($s, 'UCS-4BE', 'UTF-8'))");
  		// PHP's unpack() stores unnamed results starting at key 1, not 0.
  		return c[1];
  	}

  	/**
  		Returns the result of PHP's `mb_check_encoding` for `s` against UTF-8.
  	**/
  	public static function validate( s : String ) : Bool {
  		return untyped __call__("mb_check_encoding", s, enc);
  	}

  	/**
  		Returns the length of `s` in characters, as reported by `mb_strlen`
  		for UTF-8.
  	**/
  	public static function length( s : String ) : Int {
  		return untyped __call__("mb_strlen", s, enc);
  	}

  	/**
  		Compares `a` and `b` with PHP's `strcmp` and returns its result
  		(negative, zero or positive).
  	**/
  	public static function compare( a : String, b : String ) : Int {
  		return untyped __call__("strcmp", a, b);
  	}

  	/**
  		Returns the substring of `s` that starts at character position `pos`
  		and is at most `len` characters long (`mb_substr` with UTF-8).
  	**/
  	public static function sub( s : String, pos : Int, len : Int ) : String {
  		return untyped __call__("mb_substr", s, pos, len, enc);
  	}
  }