2
0

EReg.hx 4.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. /*
  2. * Copyright (C)2005-2017 Haxe Foundation
  3. *
  4. * Permission is hereby granted, free of charge, to any person obtaining a
  5. * copy of this software and associated documentation files (the "Software"),
  6. * to deal in the Software without restriction, including without limitation
  7. * the rights to use, copy, modify, merge, publish, distribute, sublicense,
  8. * and/or sell copies of the Software, and to permit persons to whom the
  9. * Software is furnished to do so, subject to the following conditions:
  10. *
  11. * The above copyright notice and this permission notice shall be included in
  12. * all copies or substantial portions of the Software.
  13. *
  14. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  15. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  16. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  17. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  18. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
  19. * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
  20. * DEALINGS IN THE SOFTWARE.
  21. */
  22. import java.util.regex.*;
  23. @:coreApi class EReg {
  24. private var pattern:String;
  25. private var matcher:Matcher;
  26. private var cur:String;
  27. private var isGlobal:Bool;
  28. public function new( r : String, opt : String ) {
  29. var flags = 0;
  30. for (i in 0...opt.length)
  31. {
  32. switch(StringTools.fastCodeAt(opt, i))
  33. {
  34. case 'i'.code:
  35. flags |= Pattern.CASE_INSENSITIVE;
  36. case 'm'.code:
  37. flags |= Pattern.MULTILINE;
  38. case 's'.code:
  39. flags |= Pattern.DOTALL;
  40. case 'g'.code:
  41. isGlobal = true;
  42. }
  43. }
  44. matcher = Pattern.compile(convert(r), flags).matcher("");
  45. pattern = r;
  46. }
  47. private static function convert(r:String):String
  48. {
  49. //some references of the implementation:
  50. //http://stackoverflow.com/questions/809647/java-vs-javascript-regex-problem
  51. //http://stackoverflow.com/questions/4788413/how-to-convert-javascript-regex-to-safe-java-regex
  52. //Some necessary changes:
  53. //
  54. // \0 -> \x00
  55. // \v -> \x0b
  56. // [^] -> [\s\S]
  57. // unescaped ', " -> \', \"
  58. /* FIXME
  59. var pat = new StringBuf();
  60. var len = r.length;
  61. var i = 0;
  62. while (i < len)
  63. {
  64. var c = StringTools.fastCodeAt(r, i++);
  65. switch(c)
  66. {
  67. case '\\'.code: //escape-sequence
  68. }
  69. }
  70. */
  71. return r;
  72. }
  73. public function match( s : String ) : Bool {
  74. cur = s;
  75. matcher = matcher.reset(s);
  76. return matcher.find();
  77. }
  78. public function matched( n : Int ) : String
  79. {
  80. if (n == 0)
  81. return matcher.group();
  82. else
  83. return matcher.group(n);
  84. }
  85. public function matchedLeft() : String
  86. {
  87. return untyped cur.substring(0, matcher.start());
  88. }
  89. public function matchedRight() : String
  90. {
  91. return untyped cur.substring(matcher.end(), cur.length);
  92. }
  93. public function matchedPos() : { pos : Int, len : Int } {
  94. var start = matcher.start();
  95. return { pos : start, len : matcher.end() - start };
  96. }
  97. public function matchSub( s : String, pos : Int, len : Int = -1):Bool {
  98. matcher = matcher.reset(len < 0 ? s : s.substr(0,pos + len));
  99. cur = s;
  100. return matcher.find(pos);
  101. }
  102. public function split( s : String ) : Array<String>
  103. {
  104. if (isGlobal)
  105. {
  106. var ret = [];
  107. while(this.match(s))
  108. {
  109. ret.push(matchedLeft());
  110. s = matchedRight();
  111. }
  112. ret.push(s);
  113. return ret;
  114. } else {
  115. var m = matcher;
  116. m.reset(s);
  117. if (m.find())
  118. {
  119. return untyped [s.substring(0, m.start()), s.substring(m.end(), s.length)];
  120. } else {
  121. return [s];
  122. }
  123. }
  124. }
  125. inline function start(group:Int) : Int
  126. {
  127. return matcher.start(group);
  128. }
  129. inline function len(group:Int) : Int
  130. {
  131. return matcher.end(group) - matcher.start(group);
  132. }
  133. public function replace( s : String, by : String ) : String
  134. {
  135. matcher.reset(s);
  136. by = by.split("$$").join("\\$");
  137. return isGlobal ? matcher.replaceAll(by) : matcher.replaceFirst(by);
  138. }
  139. public function map( s : String, f : EReg -> String ) : String {
  140. var offset = 0;
  141. var buf = new StringBuf();
  142. do {
  143. if (offset >= s.length)
  144. break;
  145. else if (!matchSub(s, offset)) {
  146. buf.add(s.substr(offset));
  147. break;
  148. }
  149. var p = matchedPos();
  150. buf.add(s.substr(offset, p.pos - offset));
  151. buf.add(f(this));
  152. if (p.len == 0) {
  153. buf.add(s.substr(p.pos, 1));
  154. offset = p.pos + 1;
  155. }
  156. else
  157. offset = p.pos + p.len;
  158. } while (isGlobal);
  159. if (!isGlobal && offset > 0 && offset < s.length)
  160. buf.add(s.substr(offset));
  161. return buf.toString();
  162. }
  163. public static inline function escape( s : String ) : String {
  164. return Pattern.quote(s);
  165. }
  166. }