strconv.odin 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490
  1. import . "decimal.odin";
  2. IntFlag :: enum {
  3. Prefix = 1<<0,
  4. Plus = 1<<1,
  5. Space = 1<<2,
  6. }
  7. parse_bool :: proc(s: string) -> (result: bool, ok: bool) {
  8. match s {
  9. case "1", "t", "T", "true", "TRUE", "True":
  10. return true, true;
  11. case "0", "f", "F", "false", "FALSE", "False":
  12. return false, true;
  13. }
  14. return false, false;
  15. }
  16. _digit_value :: proc(r: rune) -> int {
  17. ri := int(r);
  18. v: int = 16;
  19. match r {
  20. case '0'..'9': v = ri-'0';
  21. case 'a'..'z': v = ri-'a'+10;
  22. case 'A'..'Z': v = ri-'A'+10;
  23. }
  24. return v;
  25. }
  26. parse_i128 :: proc(s: string) -> i128 {
  27. neg := false;
  28. if len(s) > 1 {
  29. match s[0] {
  30. case '-':
  31. neg = true;
  32. s = s[1..];
  33. case '+':
  34. s = s[1..];
  35. }
  36. }
  37. base: i128 = 10;
  38. if len(s) > 2 && s[0] == '0' {
  39. match s[1] {
  40. case 'b': base = 2; s = s[2..];
  41. case 'o': base = 8; s = s[2..];
  42. case 'd': base = 10; s = s[2..];
  43. case 'z': base = 12; s = s[2..];
  44. case 'x': base = 16; s = s[2..];
  45. }
  46. }
  47. value: i128;
  48. for r in s {
  49. if r == '_' {
  50. continue;
  51. }
  52. v := i128(_digit_value(r));
  53. if v >= base {
  54. break;
  55. }
  56. value *= base;
  57. value += v;
  58. }
  59. if neg do return -value;
  60. return value;
  61. }
  62. parse_u128 :: proc(s: string) -> u128 {
  63. neg := false;
  64. if len(s) > 1 && s[0] == '+' {
  65. s = s[1..];
  66. }
  67. base := u128(10);
  68. if len(s) > 2 && s[0] == '0' {
  69. match s[1] {
  70. case 'b': base = 2; s = s[2..];
  71. case 'o': base = 8; s = s[2..];
  72. case 'd': base = 10; s = s[2..];
  73. case 'z': base = 12; s = s[2..];
  74. case 'x': base = 16; s = s[2..];
  75. }
  76. }
  77. value: u128;
  78. for r in s {
  79. if r == '_' do continue;
  80. v := u128(_digit_value(r));
  81. if v >= base do break;
  82. value *= base;
  83. value += u128(v);
  84. }
  85. if neg do return -value;
  86. return value;
  87. }
  88. parse_int :: proc(s: string) -> int {
  89. return int(parse_i128(s));
  90. }
  91. parse_uint :: proc(s: string, base: int) -> uint {
  92. return uint(parse_u128(s));
  93. }
  94. parse_f64 :: proc(s: string) -> f64 {
  95. i := 0;
  96. sign: f64 = 1;
  97. match s[i] {
  98. case '-': i += 1; sign = -1;
  99. case '+': i += 1;
  100. }
  101. value: f64 = 0;
  102. for ; i < len(s); i += 1 {
  103. r := rune(s[i]);
  104. if r == '_' do continue;
  105. v := _digit_value(r);
  106. if v >= 10 do break;
  107. value *= 10;
  108. value += f64(v);
  109. }
  110. if s[i] == '.' {
  111. pow10: f64 = 10;
  112. i += 1;
  113. for ; i < len(s); i += 1 {
  114. r := rune(s[i]);
  115. if r == '_' do continue;
  116. v := _digit_value(r);
  117. if v >= 10 do break;
  118. value += f64(v)/pow10;
  119. pow10 *= 10;
  120. }
  121. }
  122. frac := false;
  123. scale: f64 = 1;
  124. if s[i] == 'e' || s[i] == 'E' {
  125. i += 1;
  126. match s[i] {
  127. case '-': i += 1; frac = true;
  128. case '+': i += 1;
  129. }
  130. exp: u32 = 0;
  131. for ; i < len(s); i += 1 {
  132. r := rune(s[i]);
  133. if r == '_' do continue;
  134. d := u32(_digit_value(r));
  135. if d >= 10 do break;
  136. exp = exp * 10 + d;
  137. }
  138. if exp > 308 { exp = 308; }
  139. for exp >= 50 { scale *= 1e50; exp -= 50; }
  140. for exp >= 8 { scale *= 1e8; exp -= 8; }
  141. for exp > 0 { scale *= 10; exp -= 1; }
  142. }
  143. if frac do return sign * (value/scale);
  144. return sign * (value*scale);
  145. }
  146. append_bool :: proc(buf: []u8, b: bool) -> string {
  147. if b {
  148. append(&buf, "true");
  149. } else {
  150. append(&buf, "false");
  151. }
  152. return string(buf);
  153. }
  154. append_uint :: proc(buf: []u8, u: u64, base: int) -> string {
  155. return append_bits(buf, u128(u), base, false, 8*size_of(uint), digits, 0);
  156. }
  157. append_int :: proc(buf: []u8, i: i64, base: int) -> string {
  158. return append_bits(buf, u128(i), base, true, 8*size_of(int), digits, 0);
  159. }
  160. itoa :: proc(buf: []u8, i: int) -> string { return append_int(buf, i64(i), 10); }
  161. append_float :: proc(buf: []u8, f: f64, fmt: u8, prec, bit_size: int) -> string {
  162. return string(generic_ftoa(buf, f, fmt, prec, bit_size));
  163. }
  164. DecimalSlice :: struct {
  165. digits: []u8;
  166. count: int;
  167. decimal_point: int;
  168. neg: bool;
  169. }
  170. FloatInfo :: struct {
  171. mantbits: uint;
  172. expbits: uint;
  173. bias: int;
  174. }
  175. _f16_info := FloatInfo{10, 5, -15};
  176. _f32_info := FloatInfo{23, 8, -127};
  177. _f64_info := FloatInfo{52, 11, -1023};
  178. generic_ftoa :: proc(buf: []u8, val: f64, fmt: u8, prec, bit_size: int) -> []u8 {
  179. bits: u64;
  180. flt: ^FloatInfo;
  181. match bit_size {
  182. case 32:
  183. bits = u64(transmute(u32)f32(val));
  184. flt = &_f32_info;
  185. case 64:
  186. bits = transmute(u64)val;
  187. flt = &_f64_info;
  188. case:
  189. panic("strconv: invalid bit_size");
  190. }
  191. neg := bits>>(flt.expbits+flt.mantbits) != 0;
  192. exp := int(bits>>flt.mantbits) & (1<<flt.expbits - 1);
  193. mant := bits & (u64(1) << flt.mantbits - 1);
  194. match exp {
  195. case 1<<flt.expbits - 1:
  196. s: string;
  197. if mant != 0 {
  198. s = "NaN";
  199. } else if neg {
  200. s = "-Inf";
  201. } else {
  202. s = "+Inf";
  203. }
  204. append(&buf, ...cast([]u8)s);
  205. return buf;
  206. case 0: // denormalized
  207. exp += 1;
  208. case:
  209. mant |= u64(1) << flt.mantbits;
  210. }
  211. exp += flt.bias;
  212. d_: Decimal;
  213. d := &d_;
  214. assign(d, mant);
  215. shift(d, exp - int(flt.mantbits));
  216. digs: DecimalSlice;
  217. shortest := prec < 0;
  218. if shortest {
  219. round_shortest(d, mant, exp, flt);
  220. digs = DecimalSlice{digits = d.digits[..], count = d.count, decimal_point = d.decimal_point};
  221. match fmt {
  222. case 'e', 'E': prec = digs.count-1;
  223. case 'f', 'F': prec = max(digs.count-digs.decimal_point, 0);
  224. case 'g', 'G': prec = digs.count;
  225. }
  226. } else {
  227. match fmt {
  228. case 'e', 'E': round(d, prec+1);
  229. case 'f', 'F': round(d, d.decimal_point+prec);
  230. case 'g', 'G':
  231. if prec == 0 {
  232. prec = 1;
  233. }
  234. round(d, prec);
  235. }
  236. digs = DecimalSlice{digits = d.digits[..], count = d.count, decimal_point = d.decimal_point};
  237. }
  238. return format_digits(buf, shortest, neg, digs, prec, fmt);
  239. }
  240. format_digits :: proc(buf: []u8, shortest: bool, neg: bool, digs: DecimalSlice, prec: int, fmt: u8) -> []u8 {
  241. match fmt {
  242. case 'f', 'F':
  243. append(&buf, neg ? '-' : '+');
  244. // integer, padded with zeros when needed
  245. if digs.decimal_point > 0 {
  246. m := min(digs.count, digs.decimal_point);
  247. append(&buf, ...digs.digits[..m]);
  248. for ; m < digs.decimal_point; m += 1 {
  249. append(&buf, '0');
  250. }
  251. } else {
  252. append(&buf, '0');
  253. }
  254. // fractional part
  255. if prec > 0 {
  256. append(&buf, '.');
  257. for i in 0..prec {
  258. c: u8 = '0';
  259. if j := digs.decimal_point + i; 0 <= j && j < digs.count {
  260. c = digs.digits[j];
  261. }
  262. append(&buf, c);
  263. }
  264. }
  265. return buf;
  266. case 'e', 'E':
  267. panic("strconv: e/E float printing is not yet supported");
  268. return buf; // TODO
  269. case 'g', 'G':
  270. panic("strconv: g/G float printing is not yet supported");
  271. return buf; // TODO
  272. }
  273. c := [2]u8{'%', fmt};
  274. append(&buf, ...c[..]);
  275. return buf;
  276. }
  277. round_shortest :: proc(d: ^Decimal, mant: u64, exp: int, flt: ^FloatInfo) {
  278. if mant == 0 { // If mantissa is zero, the number is zero
  279. d.count = 0;
  280. return;
  281. }
  282. /*
  283. 10^(dp-nd) > 2^(exp-mantbits)
  284. log2(10) * (dp-nd) > exp-mantbits
  285. log(2) >~ 0.332
  286. 332*(dp-nd) >= 100*(exp-mantbits)
  287. */
  288. minexp := flt.bias+1;
  289. if exp > minexp && 332*(d.decimal_point-d.count) >= 100*(exp - int(flt.mantbits)) {
  290. // Number is already its shortest
  291. return;
  292. }
  293. upper_: Decimal; upper := &upper_;
  294. assign(upper, 2*mant - 1);
  295. shift(upper, exp - int(flt.mantbits) - 1);
  296. mantlo: u64;
  297. explo: int;
  298. if mant > 1<<flt.mantbits || exp == minexp {
  299. mantlo = mant-1;
  300. explo = exp;
  301. } else {
  302. mantlo = 2*mant - 1;
  303. explo = exp-1;
  304. }
  305. lower_: Decimal; lower := &lower_;
  306. assign(lower, 2*mantlo + 1);
  307. shift(lower, explo - int(flt.mantbits) - 1);
  308. inclusive := mant%2 == 0;
  309. for i in 0..d.count {
  310. l: u8 = '0'; // lower digit
  311. if i < lower.count {
  312. l = lower.digits[i];
  313. }
  314. m := d.digits[i]; // middle digit
  315. u: u8 = '0'; // upper digit
  316. if i < upper.count {
  317. u = upper.digits[i];
  318. }
  319. ok_round_down := l != m || inclusive && i+1 == lower.count;
  320. ok_round_up := m != u && (inclusive || m+1 < u || i+1 < upper.count);
  321. if (ok_round_down && ok_round_up) {
  322. round(d, i+1);
  323. return;
  324. }
  325. if (ok_round_down) {
  326. round_down(d, i+1);
  327. return;
  328. }
  329. if (ok_round_up) {
  330. round_up(d, i+1);
  331. return;
  332. }
  333. }
  334. }
  335. MAX_BASE :: 32;
  336. digits := "0123456789abcdefghijklmnopqrstuvwxyz";
  337. is_integer_negative :: proc(u: u128, is_signed: bool, bit_size: int) -> (unsigned: u128, neg: bool) {
  338. neg := false;
  339. if is_signed {
  340. match bit_size {
  341. case 8:
  342. i := i8(u);
  343. neg = i < 0;
  344. if neg { i = -i; }
  345. u = u128(i);
  346. case 16:
  347. i := i16(u);
  348. neg = i < 0;
  349. if neg { i = -i; }
  350. u = u128(i);
  351. case 32:
  352. i := i32(u);
  353. neg = i < 0;
  354. if neg { i = -i; }
  355. u = u128(i);
  356. case 64:
  357. i := i64(u);
  358. neg = i < 0;
  359. if neg { i = -i; }
  360. u = u128(i);
  361. case 128:
  362. i := i128(u);
  363. neg = i < 0;
  364. if neg { i = -i; }
  365. u = u128(i);
  366. case:
  367. panic("is_integer_negative: Unknown integer size");
  368. }
  369. }
  370. return u, neg;
  371. }
  372. append_bits :: proc(buf: []u8, u: u128, base: int, is_signed: bool, bit_size: int, digits: string, flags: IntFlag) -> string {
  373. if base < 2 || base > MAX_BASE {
  374. panic("strconv: illegal base passed to append_bits");
  375. }
  376. neg: bool;
  377. a: [129]u8;
  378. i := len(a);
  379. u, neg = is_integer_negative(u, is_signed, bit_size);
  380. b := u128(base);
  381. for u >= b {
  382. i-=1; a[i] = digits[uint(u % b)];
  383. u /= b;
  384. }
  385. i-=1; a[i] = digits[uint(u % b)];
  386. if flags&IntFlag.Prefix != 0 {
  387. ok := true;
  388. match base {
  389. case 2: i-=1; a[i] = 'b';
  390. case 8: i-=1; a[i] = 'o';
  391. case 10: i-=1; a[i] = 'd';
  392. case 12: i-=1; a[i] = 'z';
  393. case 16: i-=1; a[i] = 'x';
  394. case: ok = false;
  395. }
  396. if ok {
  397. i-=1; a[i] = '0';
  398. }
  399. }
  400. if neg {
  401. i-=1; a[i] = '-';
  402. } else if flags&IntFlag.Plus != 0 {
  403. i-=1; a[i] = '+';
  404. } else if flags&IntFlag.Space != 0 {
  405. i-=1; a[i] = ' ';
  406. }
  407. append(&buf, ...a[i..]);
  408. return string(buf);
  409. }