123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277 |
- /*
- * Copyright (C)2005-2012 Haxe Foundation
- *
- * Permission is hereby granted, free of charge, to any person obtaining a
- * copy of this software and associated documentation files (the "Software"),
- * to deal in the Software without restriction, including without limitation
- * the rights to use, copy, modify, merge, publish, distribute, sublicense,
- * and/or sell copies of the Software, and to permit persons to whom the
- * Software is furnished to do so, subject to the following conditions:
- *
- * The above copyright notice and this permission notice shall be included in
- * all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
- * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
- * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
- * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
- * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
- * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
- * DEALINGS IN THE SOFTWARE.
- */
- import python.internal.UBuiltins;
- import python.lib.Re;
- import python.lib.Re.MatchObject;
- import python.lib.Re.Pattern;
- @:coreApi
- class EReg {
- /**
- Creates a new regular expression with pattern `r` and modifiers `opt`.
- This is equivalent to the shorthand syntax `~/r/opt`
- If `r` or `opt` are null, the result is unspecified.
- **/
- var pattern:Regex;
- var matchObj:MatchObject;
- var global:Bool;
- public function new( r : String, opt : String ) {
- global = false;
- var options = 0;
- for (i in 0...opt.length) {
- var c = StringTools.fastCodeAt(opt, i);
- if (c == "m".code) options |= Re.M;
- if (c == "i".code) options |= Re.I;
- if (c == "s".code) options |= Re.S;
- if (c == "u".code) options |= Re.U;
- if (c == "g".code) global = true;
- }
- pattern = Re.compile(r, options);
- }
- /**
- Tells if `this` regular expression matches String `s`.
- This method modifies the internal state.
- If `s` is `null`, the result is unspecified.
- **/
- public inline function match( s : String ) : Bool {
- matchObj = Re.search(pattern, s);
- return matchObj != null;
- }
- /**
- Returns the matched sub-group `n` of `this` EReg.
- This method should only be called after `this.match` or
- `this.matchSub`, and then operates on the String of that operation.
- The index `n` corresponds to the n-th set of parentheses in the pattern
- of `this` EReg. If no such sub-group exists, an exception is thrown.
- If `n` equals 0, the whole matched substring is returned.
- **/
- public inline function matched( n : Int ) : String {
- return matchObj.group(n);
- }
- /**
- Returns the part to the left of the last matched substring.
- If the most recent call to `this.match` or `this.matchSub` did not
- match anything, the result is unspecified.
- If the global g modifier was in place for the matching, only the
- substring to the left of the leftmost match is returned.
- The result does not include the matched part.
- **/
- public inline function matchedLeft() : String {
- return matchObj.string.substr(0, matchObj.start());
- }
- /**
- Returns the part to the right of the last matched substring.
- If the most recent call to `this.match` or `this.matchSub` did not
- match anything, the result is unspecified.
- If the global g modifier was in place for the matching, only the
- substring to the right of the leftmost match is returned.
- The result does not include the matched part.
- **/
- public inline function matchedRight() : String {
- return matchObj.string.substr(matchObj.end());
- }
- /**
- Returns the position and length of the last matched substring, within
- the String which was last used as argument to `this.match` or
- `this.matchSub`.
- If the most recent call to `this.match` or `this.matchSub` did not
- match anything, the result is unspecified.
- If the global g modifier was in place for the matching, the position and
- length of the leftmost substring is returned.
- **/
- public inline function matchedPos() : { pos : Int, len : Int } {
- return { pos : matchObj.start(), len : matchObj.end() - matchObj.start() };
- }
- /**
- Tells if `this` regular expression matches a substring of String `s`.
- This function expects `pos` and `len` to describe a valid substring of
- `s`, or else the result is unspecified. To get more robust behavior,
- `this.matchSub(s.substr(pos,len))` can be used instead.
- This method modifies the internal state.
- If `s` is null, the result is unspecified.
- **/
- public function matchSub( s : String, pos : Int, len : Int = -1):Bool {
- if (len != -1) {
- matchObj = pattern.search(s, pos, pos+len);
- } else {
- matchObj = pattern.search(s, pos);
- }
- return this.matchObj != null;
- }
- /**
- Splits String `s` at all substrings `this` EReg matches.
- If a match is found at the start of `s`, the result contains a leading
- empty String "" entry.
- If a match is found at the end of `s`, the result contains a trailing
- empty String "" entry.
- If two matching substrings appear next to each other, the result
- contains the empty String "" between them.
- By default, this method splits `s` into two parts at the first matched
- substring. If the global g modifier is in place, `s` is split at each
- matched substring.
- If `s` is null, the result is unspecified.
- **/
- public function split( s : String ) : Array<String> {
- return if (global) {
- var ret = [];
- var lastEnd = 0;
- for (x in Re.finditer(pattern, s)) {
- ret.push(s.substring(lastEnd, x.start() ));
- lastEnd = x.end();
- }
- ret.push(s.substr(lastEnd));
- ret;
- } else {
- this.match(s);
- if (matchObj == null) {
- [s];
- } else {
- [ s.substring(0, matchObj.start()), s.substr(matchObj.end()) ];
- }
- }
- }
- /**
- Replaces the first substring of `s` which `this` EReg matches with `by`.
- If `this` EReg does not match any substring, the result is `s`.
- By default, this method replaces only the first matched substring. If
- the global g modifier is in place, all matched substrings are replaced.
- If `by` contains `$1` to `$9`, the digit corresponds to number of a
- matched sub-group and its value is used instead. If no such sub-group
- exists, the replacement is unspecified. The string `$$` becomes `$`.
- If `s` or `by` are null, the result is unspecified.
- **/
- public function replace( s : String, by : String ) : String
- {
- var by = by.split("$$").join("_hx_#repl#__");
- function replace (x:MatchObject) {
- var res = by;
- var g = x.groups();
- for (i in 0...g.length) {
- res = res.split("$"+UBuiltins.str(i+1)).join(g[i]);
- }
- res = res.split("_hx_#repl#__").join("$");
- return res;
- }
- return Re.sub(pattern, replace, s, global ? 0 : 1 );
- }
- /**
- For each occurence of the pattern in the string `s`, the function `f` is called and
- can return the string that needs to be replaced. All occurences are matched anyway,
- and setting the `g` flag might cause some incorrect behavior on some platforms.
- **/
- public function map( s : String, f : EReg -> String ) : String {
- var buf = new StringBuf();
- var pos = 0;
- var right = s;
- var cur = this;
- while( pos < s.length ) {
- if (matchObj == null) {
- matchObj = Re.search(pattern, s);
- } else {
- matchObj = matchObj.re.search(s, pos);
- }
- if( matchObj == null )
- break;
- var pos1 = matchObj.end();
- var curPos = cur.matchedPos();
- buf.add(cur.matchedLeft().substr(pos));
- buf.add(f(cur));
- right = cur.matchedRight();
- if (!global) {
- buf.add(right);
- return buf.toString();
- }
- if (curPos.len == 0) {
- buf.add(s.charAt(pos1));
- right = right.substr(1);
- pos = pos1+1;
- } else {
- pos = pos1;
- }
- }
- buf.add(right);
- return buf.toString();
- }
- }
|