Ver código fonte

Add `io.write_quoted_*` utility procedures to `package io`

gingerBill 3 anos atrás
pai
commit
b3f2263442
2 arquivos alterados com 163 adições e 122 exclusões
  1. 153 0
      core/io/util.odin
  2. 10 122
      core/strings/builder.odin

+ 153 - 0
core/io/util.odin

@@ -2,6 +2,7 @@ package io
 
 import "core:mem"
 import "core:strconv"
+import "core:unicode/utf8"
 
 
 read_ptr :: proc(r: Reader, p: rawptr, byte_size: int) -> (n: int, err: Error) {
@@ -38,6 +39,158 @@ write_int :: proc(w: Writer, i: int, base: int = 10) -> (n: int, err: Error) {
 	return write_i64(w, i64(i), base)
 }
 
+
+
+@(private="file")
+DIGITS_LOWER := "0123456789abcdefx"
+
+@(private="file")
+n_write_byte :: proc(w: Writer, b: byte, bytes_processed: ^int) -> Error {
+	err := write_byte(w, b)
+	if err == nil {
+		bytes_processed^ += 1
+	}
+	return err
+}
+
+n_wrapper :: proc(n: int, err: Error, bytes_processed: ^int) -> Error {
+	bytes_processed^ += n
+	return err
+}
+
+
+write_encoded_rune :: proc(w: Writer, r: rune, write_quote := true) -> (n: int, err: Error) {
+	if write_quote {
+		n_write_byte(w, '\'', &n) or_return
+	}
+	switch r {
+	case '\a': n_wrapper(write_string(w, `\a"`), &n) or_return
+	case '\b': n_wrapper(write_string(w, `\b"`), &n) or_return
+	case '\e': n_wrapper(write_string(w, `\e"`), &n) or_return
+	case '\f': n_wrapper(write_string(w, `\f"`), &n) or_return
+	case '\n': n_wrapper(write_string(w, `\n"`), &n) or_return
+	case '\r': n_wrapper(write_string(w, `\r"`), &n) or_return
+	case '\t': n_wrapper(write_string(w, `\t"`), &n) or_return
+	case '\v': n_wrapper(write_string(w, `\v"`), &n) or_return
+	case:
+		if r < 32 {
+			n_wrapper(write_string(w, `\x`), &n) or_return
+			
+			buf: [2]byte
+			s := strconv.append_bits(buf[:], u64(r), 16, true, 64, strconv.digits, nil)
+			switch len(s) {
+			case 0: n_wrapper(write_string(w, "00"), &n) or_return
+			case 1: n_write_byte(w, '0', &n)             or_return
+			case 2: n_wrapper(write_string(w, s), &n)    or_return
+			}
+		} else {
+			n_wrapper(write_rune(w, r), &n) or_return
+		}
+
+	}
+	if write_quote {
+		n_write_byte(w, '\'', &n) or_return
+	}
+	return
+}
+
+write_escaped_rune :: proc(w: Writer, r: rune, quote: byte, html_safe := false) -> (n: int, err: Error) {
+	is_printable :: proc(r: rune) -> bool {
+		if r <= 0xff {
+			switch r {
+			case 0x20..=0x7e:
+				return true
+			case 0xa1..=0xff: // ¡ through ÿ except for the soft hyphen
+				return r != 0xad //
+			}
+		}
+
+		// TODO(bill): A proper unicode library will be needed!
+		return false
+	}
+	
+	if html_safe {
+		switch r {
+		case '<', '>', '&':
+			n_write_byte(w, '\\', &n) or_return
+			n_write_byte(w, 'u', &n)  or_return
+			for s := 12; s >= 0; s -= 4 {
+				n_write_byte(w, DIGITS_LOWER[r>>uint(s) & 0xf], &n) or_return
+			}
+			return
+		}
+	}
+
+	if r == rune(quote) || r == '\\' {
+		n_write_byte(w, '\\', &n)    or_return
+		n_write_byte(w, byte(r), &n) or_return
+		return
+	} else if is_printable(r) {
+		n_wrapper(write_encoded_rune(w, r, false), &n) or_return
+		return
+	}
+	switch r {
+	case '\a': n_wrapper(write_string(w, `\a`), &n) or_return
+	case '\b': n_wrapper(write_string(w, `\b`), &n) or_return
+	case '\e': n_wrapper(write_string(w, `\e`), &n) or_return
+	case '\f': n_wrapper(write_string(w, `\f`), &n) or_return
+	case '\n': n_wrapper(write_string(w, `\n`), &n) or_return
+	case '\r': n_wrapper(write_string(w, `\r`), &n) or_return
+	case '\t': n_wrapper(write_string(w, `\t`), &n) or_return
+	case '\v': n_wrapper(write_string(w, `\v`), &n) or_return
+	case:
+		switch c := r; {
+		case c < ' ':
+			n_write_byte(w, '\\', &n)                      or_return
+			n_write_byte(w, 'x', &n)                       or_return
+			n_write_byte(w, DIGITS_LOWER[byte(c)>>4], &n)  or_return
+			n_write_byte(w, DIGITS_LOWER[byte(c)&0xf], &n) or_return
+
+		case c > utf8.MAX_RUNE:
+			c = 0xfffd
+			fallthrough
+		case c < 0x10000:
+			n_write_byte(w, '\\', &n) or_return
+			n_write_byte(w, 'u', &n)  or_return
+			for s := 12; s >= 0; s -= 4 {
+				n_write_byte(w, DIGITS_LOWER[c>>uint(s) & 0xf], &n) or_return
+			}
+		case:
+			n_write_byte(w, '\\', &n) or_return
+			n_write_byte(w, 'U', &n)  or_return
+			for s := 28; s >= 0; s -= 4 {
+				n_write_byte(w, DIGITS_LOWER[c>>uint(s) & 0xf], &n) or_return
+			}
+		}
+	}
+	return
+}
+
+write_quoted_string :: proc(w: Writer, str: string, quote: byte = '"') -> (n: int, err: Error) {
+	n_write_byte(w, quote, &n) or_return
+	for width, s := 0, str; len(s) > 0; s = s[width:] {
+		r := rune(s[0])
+		width = 1
+		if r >= utf8.RUNE_SELF {
+			r, width = utf8.decode_rune_in_string(s)
+		}
+		if width == 1 && r == utf8.RUNE_ERROR {
+			n_write_byte(w, '\\', &n)                   or_return
+			n_write_byte(w, 'x', &n)                    or_return
+			n_write_byte(w, DIGITS_LOWER[s[0]>>4], &n)  or_return
+			n_write_byte(w, DIGITS_LOWER[s[0]&0xf], &n) or_return
+			continue
+		}
+
+		n_wrapper(write_escaped_rune(w, r, quote), &n) or_return
+
+	}
+	n_write_byte(w, quote, &n) or_return
+	return
+}
+
+
+
 Tee_Reader :: struct {
 	r: Reader,
 	w: Writer,

+ 10 - 122
core/strings/builder.odin

@@ -218,30 +218,13 @@ write_quoted_string :: proc{
 }
 
 write_quoted_string_builder :: proc(b: ^Builder, str: string, quote: byte = '"') -> (n: int) {
-	return write_quoted_string_writer(to_writer(b), str, quote)
+	n, _ = io.write_quoted_string(to_writer(b), str, quote)
+	return
 }
 
 write_quoted_string_writer :: proc(w: io.Writer, str: string, quote: byte = '"') -> (n: int) {
-	n += _write_byte(w, quote)
-	for width, s := 0, str; len(s) > 0; s = s[width:] {
-		r := rune(s[0])
-		width = 1
-		if r >= utf8.RUNE_SELF {
-			r, width = utf8.decode_rune_in_string(s)
-		}
-		if width == 1 && r == utf8.RUNE_ERROR {
-			n += _write_byte(w, '\\')
-			n += _write_byte(w, 'x')
-			n += _write_byte(w, DIGITS_LOWER[s[0]>>4])
-			n += _write_byte(w, DIGITS_LOWER[s[0]&0xf])
-			continue
-		}
-
-		n += write_escaped_rune(w, r, quote)
-
-	}
-	n += _write_byte(w, quote)
-	return
+	n, _ = io.write_quoted_string(w, str, quote)
+	return	
 }
 
 write_encoded_rune :: proc{
@@ -250,41 +233,12 @@ write_encoded_rune :: proc{
 }
 
 write_encoded_rune_builder :: proc(b: ^Builder, r: rune, write_quote := true) -> (n: int) {
-	return write_encoded_rune_writer(to_writer(b), r, write_quote)
+	n, _ = io.write_encoded_rune(to_writer(b), r, write_quote)
+	return
 
 }
 write_encoded_rune_writer :: proc(w: io.Writer, r: rune, write_quote := true) -> (n: int) {
-	if write_quote {
-		n += _write_byte(w, '\'')
-	}
-	switch r {
-	case '\a': n += write_string(w, `\a"`)
-	case '\b': n += write_string(w, `\b"`)
-	case '\e': n += write_string(w, `\e"`)
-	case '\f': n += write_string(w, `\f"`)
-	case '\n': n += write_string(w, `\n"`)
-	case '\r': n += write_string(w, `\r"`)
-	case '\t': n += write_string(w, `\t"`)
-	case '\v': n += write_string(w, `\v"`)
-	case:
-		if r < 32 {
-			n += write_string(w, `\x`)
-			buf: [2]byte
-			s := strconv.append_bits(buf[:], u64(r), 16, true, 64, strconv.digits, nil)
-			switch len(s) {
-			case 0: n += write_string(w, "00")
-			case 1: n += _write_byte(w, '0')
-			case 2: n += write_string(w, s)
-			}
-		} else {
-			rn, _ := io.write_rune(w, r)
-			n += rn
-		}
-
-	}
-	if write_quote {
-		n += _write_byte(w, '\'')
-	}
+	n, _ = io.write_encoded_rune(w, r, write_quote)
 	return
 }
 
@@ -295,78 +249,12 @@ write_escaped_rune :: proc{
 }
 
 write_escaped_rune_builder :: proc(b: ^Builder, r: rune, quote: byte, html_safe := false) -> (n: int) {
-	return write_escaped_rune_writer(to_writer(b), r, quote, html_safe)
+	n, _ = io.write_escaped_rune(to_writer(b), r, quote, html_safe)
+	return
 }
 
 write_escaped_rune_writer :: proc(w: io.Writer, r: rune, quote: byte, html_safe := false) -> (n: int) {
-	is_printable :: proc(r: rune) -> bool {
-		if r <= 0xff {
-			switch r {
-			case 0x20..=0x7e:
-				return true
-			case 0xa1..=0xff: // ¡ through ÿ except for the soft hyphen
-				return r != 0xad //
-			}
-		}
-
-		// TODO(bill): A proper unicode library will be needed!
-		return false
-	}
-
-	if html_safe {
-		switch r {
-		case '<', '>', '&':
-			n += _write_byte(w, '\\')
-			n += _write_byte(w, 'u')
-			for s := 12; s >= 0; s -= 4 {
-				n += _write_byte(w, DIGITS_LOWER[r>>uint(s) & 0xf])
-			}
-			return
-		}
-	}
-
-	if r == rune(quote) || r == '\\' {
-		n += _write_byte(w, '\\')
-		n += _write_byte(w, byte(r))
-		return
-	} else if is_printable(r) {
-		n += write_encoded_rune(w, r, false)
-		return
-	}
-	switch r {
-	case '\a': n += write_string(w, `\a`)
-	case '\b': n += write_string(w, `\b`)
-	case '\e': n += write_string(w, `\e`)
-	case '\f': n += write_string(w, `\f`)
-	case '\n': n += write_string(w, `\n`)
-	case '\r': n += write_string(w, `\r`)
-	case '\t': n += write_string(w, `\t`)
-	case '\v': n += write_string(w, `\v`)
-	case:
-		switch c := r; {
-		case c < ' ':
-			n += _write_byte(w, '\\')
-			n += _write_byte(w, 'x')
-			n += _write_byte(w, DIGITS_LOWER[byte(c)>>4])
-			n += _write_byte(w, DIGITS_LOWER[byte(c)&0xf])
-
-		case c > utf8.MAX_RUNE:
-			c = 0xfffd
-			fallthrough
-		case c < 0x10000:
-			n += _write_byte(w, '\\')
-			n += _write_byte(w, 'u')
-			for s := 12; s >= 0; s -= 4 {
-				n += _write_byte(w, DIGITS_LOWER[c>>uint(s) & 0xf])
-			}
-		case:
-			n += _write_byte(w, '\\')
-			n += _write_byte(w, 'U')
-			for s := 28; s >= 0; s -= 4 {
-				n += _write_byte(w, DIGITS_LOWER[c>>uint(s) & 0xf])
-			}
-		}
-	}
+	n, _ = io.write_escaped_rune(w, r, quote, html_safe)
 	return
 }