EReg.hx 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174
  /*
   * Copyright (C)2005-2018 Haxe Foundation
   *
   * Permission is hereby granted, free of charge, to any person obtaining a
   * copy of this software and associated documentation files (the "Software"),
   * to deal in the Software without restriction, including without limitation
   * the rights to use, copy, modify, merge, publish, distribute, sublicense,
   * and/or sell copies of the Software, and to permit persons to whom the
   * Software is furnished to do so, subject to the following conditions:
   *
   * The above copyright notice and this permission notice shall be included in
   * all copies or substantial portions of the Software.
   *
   * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
   * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
   * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
   * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
   * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
   * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
   * DEALINGS IN THE SOFTWARE.
   */
  22. import lua.lib.lrexlib.Rex;
  23. import lua.Table;
  24. import lua.Lib;
  25. import lua.NativeStringTools;
  /**
      Regular expression class for the Lua target, implemented on top of the
      lrexlib `Rex` extern.

      A match attempt (`match` / `matchSub`) stores the subject string in `s`
      and the packed result of `Rex.exec` in `m`; the `matched*` accessors read
      from that stored state.
  **/
  @:coreApi
  class EReg {
      var r : Rex; // the Rex extern instance.
      var global : Bool; // whether the regex is in global mode.
      var s : String; // the last matched string
      var m : Table<Int,Int>; // the [start:Int, end:Int, and submatches:String (matched groups)] as a single table.

      static var FLAGS : Table<String,Int> = Rex.flags();

      /**
          Compiles the pattern `r` with the options in `opt`.

          Recognized option characters are "i" (CASELESS), "m" (MULTILINE),
          "s" (DOTALL) and "g" (global mode). Any other character is ignored.
      **/
      public function new( r : String, opt : String ) : Void {
          // Initialize up front so the flag is a real Bool even when `opt` has no "g".
          global = false;
          var ropt = 0;
          for (i in 0...opt.length) {
              switch (opt.charAt(i)) {
                  case "i" : ropt |= FLAGS.CASELESS;
                  case "m" : ropt |= FLAGS.MULTILINE;
                  case "s" : ropt |= FLAGS.DOTALL;
                  case "g" : global = true;
                  default : null;
              }
          }
          ropt |= FLAGS.UTF8; // always check validity of utf8 string
          ropt |= FLAGS.UCP; // always enable utf8 character properties
          this.r = Rex.create(r, ropt);
      }

      /**
          Runs the regex against `s` and records the result.

          Returns false without touching the stored match state when `s` is null.
      **/
      public function match( s : String ) : Bool {
          if (s == null) return false;
          this.m = lua.TableTools.pack(r.exec(s));
          this.s = s;
          return m[1] != null;
      }

      /**
          Returns the text of group `n` of the last successful match; `n == 0`
          is the whole match.

          Returns null when the stored capture entry for group `n` is a Bool
          (the marker used for a group that did not take part in the match).

          Throws "EReg::matched" when no match is stored, when `n` is negative,
          or when a group is requested but no capture table is available.
      **/
      public function matched( n : Int ) : String {
          // `m` is null until a match attempt has been made; guard before indexing it.
          if (m == null || m[1] == null || n < 0) {
              throw "EReg::matched";
          } else if (n == 0) {
              return NativeStringTools.sub(s, m[1], m[2]).match;
          } else if (Std.is(m[3], lua.Table)) {
              // Captures are stored as consecutive (start, end) pairs, 1-based.
              var mn = 2 * (n - 1);
              if (Std.is(untyped m[3][mn + 1], Bool)) return null;
              return NativeStringTools.sub(s, untyped m[3][mn + 1], untyped m[3][mn + 2]).match;
          } else {
              throw "EReg::matched";
          }
      }

      /**
          Returns the part of the subject that precedes the last match.
          Throws "No string matched" when there is no stored match.
      **/
      public function matchedLeft() : String {
          if (m == null || m[1] == null) throw "No string matched";
          return NativeStringTools.sub(s, 1, m[1] - 1).match;
      }

      /**
          Returns the part of the subject that follows the last match.
          Throws "No string matched" when there is no stored match.
      **/
      public function matchedRight() : String {
          if (m == null || m[1] == null) throw "No string matched";
          return NativeStringTools.sub(s, m[2] + 1).match;
      }

      /**
          Returns the position and length of the last match, derived from the
          lengths of `matchedLeft()` and `matched(0)`.
          Throws "No string matched" when there is no stored match.
      **/
      public function matchedPos() : { pos : Int, len : Int } {
          // Validate first: the accessors below would otherwise throw before
          // this check could ever run.
          if (m == null || m[1] == null) throw "No string matched";
          var left = matchedLeft();
          var whole = matched(0);
          return {
              pos : left.length,
              len : whole.length
          }
      }

      /**
          Runs the regex against `s` starting at offset `pos`, looking at no
          more than `len` characters from there (the whole remainder when `len`
          is negative).

          The stored subject string is only replaced when the match succeeds.
      **/
      public function matchSub( s : String, pos : Int, len : Int = -1 ) : Bool {
          // Truncate the subject so the search cannot run past pos + len.
          var ss = s.substr(0, len < 0 ? s.length : pos + len);
          // Rex offsets are 1-based, hence pos + 1.
          m = lua.TableTools.pack(r.exec(ss, pos + 1));
          var found = m[1] != null;
          if (found) {
              this.s = s;
          }
          return found;
      }

      /**
          Splits `s` around matches of this regex: every match in global mode,
          only the first match otherwise.
      **/
      public function split( s : String ) : Array<String> {
          if (global) {
              return Lib.fillArray(Rex.split(s, r));
          } else {
              // we can't use directly Rex.split because it's ignoring the 'g' flag
              // NOTE(review): an input that already contains the placeholder text
              // would presumably be split there as well - confirm whether that matters.
              var d = "#__delim__#";
              return Lib.fillArray(Rex.split(replace(s, d), d));
          }
      }

      /**
          Replaces the first match (every match in global mode) of this regex
          in `s` with `by`.

          In `by`, "$N" (single digit) refers to group N and "$$" is a literal
          "$".
      **/
      public function replace( s : String, by : String ) : String {
          // Split on "$$" first so an escaped dollar is never mistaken for a group reference.
          var chunks = by.split("$$");
          chunks = [
              for (chunk in chunks)
                  // "%" is the escape character of Rex replacement templates: double
                  // any literal "%" so it survives, then turn every "$N" into "%N".
                  // No match limit here - all group references must be converted.
                  Rex.gsub(chunk.split("%").join("%%"), "\\$(\\d)", "%%%1", null)
          ];
          by = chunks.join("$");
          return Rex.gsub(s, r, by, global ? null : 1);
      }

      /**
          Builds a new string from `s` in which each match (only the first one
          unless in global mode) is replaced by the result of `f(this)`.
      **/
      public function map( s : String, f : EReg -> String ) : String {
          var offset = 0;
          var buf = new StringBuf();
          do {
              if (offset >= s.length) {
                  break;
              } else if (!matchSub(s, offset)) {
                  // No further match: copy the remainder verbatim.
                  buf.add(s.substr(offset));
                  break;
              }
              var p = matchedPos();
              buf.add(s.substr(offset, p.pos - offset));
              buf.add(f(this));
              if (p.len == 0) {
                  // Empty match: copy one character and step past it so the loop advances.
                  buf.add(s.substr(p.pos, 1));
                  offset = p.pos + 1;
              } else {
                  offset = p.pos + p.len;
              }
          } while (global);
          // In non-global mode the loop ran once; append whatever follows the match.
          if (!global && offset > 0 && offset < s.length)
              buf.add(s.substr(offset));
          return buf.toString();
      }

      /**
          Returns `s` with every character matched by `escapeRegExpRe` prefixed
          by a backslash.
      **/
      public static function escape( s : String ) : String {
          return escapeRegExpRe.map(s, function(r) return "\\" + r.matched(0));
      }

      static var escapeRegExpRe = ~/[\[\]{}()*+?.\\\^$|]/g;

      // Fails at startup with a clear message when the Rex library is not available.
      static function __init__() : Void {
          if (Rex == null) {
              throw "Rex is missing. Please install lrexlib-pcre.";
          }
      }
  }