strconv.odin 9.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498
  1. #import . "decimal.odin";
  // Bit flags selecting the optional decorations that append_bits writes
  // in front of the digits. Each flag occupies its own bit so they can be
  // tested independently with `&`.
  IntFlag :: enum {
      Prefix = 1 << 0, // emit a base marker such as "0x"
      Plus   = 1 << 1, // emit '+' in front of non-negative values
      Space  = 1 << 2, // emit ' ' in front of non-negative values
  }
  // parse_bool converts a textual boolean into a bool.
  //
  // Accepted spellings for true:  "1", "t", "T", "true", "TRUE", "True".
  // Accepted spellings for false: "0", "f", "F", "false", "FALSE", "False".
  //
  // The second result reports whether `s` was one of the accepted spellings;
  // when it is false the first result is always false.
  parse_bool :: proc(s: string) -> (result: bool, ok: bool) {
      if s == "1" || s == "t" || s == "T" || s == "true" || s == "TRUE" || s == "True" {
          return true, true;
      }
      if s == "0" || s == "f" || s == "F" || s == "false" || s == "FALSE" || s == "False" {
          return false, true;
      }
      // Anything else is not a recognised boolean.
      return false, false;
  }
  // _digit_value maps a rune to its numeric digit value.
  //
  // '0'..'9' map to 0..9, and letters of either case map to 10..35
  // ('a'/'A' = 10 ... 'z'/'Z' = 35). Every other rune yields 16, which the
  // parsers in this file treat as "not a digit" because it is never below
  // the bases they use (2, 8, 10, 12, 16).
  _digit_value :: proc(r: rune) -> (int) {
      code := int(r);
      if '0' <= r && r <= '9' {
          return code-'0';
      }
      if 'a' <= r && r <= 'z' {
          return code-'a'+10;
      }
      if 'A' <= r && r <= 'Z' {
          return code-'A'+10;
      }
      return 16;
  }
  // parse_i128 parses a signed integer literal.
  //
  // Grammar handled, in order:
  //   * an optional leading '-' or '+' (only when more characters follow),
  //   * an optional base prefix "0b", "0o", "0d", "0z" or "0x"
  //     (bases 2, 8, 10, 12 and 16; only when more characters follow),
  //   * digits, with '_' separators skipped.
  //
  // Parsing stops silently at the first character that is not a digit of the
  // selected base; whatever was accumulated so far is returned. No overflow
  // or error reporting is performed.
  parse_i128 :: proc(s: string) -> i128 {
      negative := false;
      if len(s) > 1 {
          if s[0] == '-' {
              negative = true;
              s = s[1..];
          } else if s[0] == '+' {
              s = s[1..];
          }
      }

      radix: i128 = 10;
      if len(s) > 2 && s[0] == '0' {
          has_prefix := true;
          match s[1] {
          case 'b': radix = 2;
          case 'o': radix = 8;
          case 'd': radix = 10;
          case 'z': radix = 12;
          case 'x': radix = 16;
          case:     has_prefix = false;
          }
          if has_prefix {
              // Drop the two prefix characters.
              s = s[2..];
          }
      }

      total: i128;
      for r in s {
          if r != '_' {
              digit := i128(_digit_value(r));
              if digit >= radix {
                  // Not a digit of this base: stop parsing.
                  break;
              }
              total = total*radix + digit;
          }
      }

      if negative {
          return -total;
      }
      return total;
  }
  // parse_u128 parses an unsigned integer literal.
  //
  // Grammar handled, in order:
  //   * an optional leading '+' (only when more characters follow),
  //   * an optional base prefix "0b", "0o", "0d", "0z" or "0x"
  //     (bases 2, 8, 10, 12 and 16; only when more characters follow),
  //   * digits, with '_' separators skipped.
  //
  // Parsing stops silently at the first character that is not a digit of the
  // selected base (this includes a leading '-'); whatever was accumulated so
  // far is returned. No overflow or error reporting is performed.
  parse_u128 :: proc(s: string) -> u128 {
      if len(s) > 1 && s[0] == '+' {
          s = s[1..];
      }

      base := u128(10);
      if len(s) > 2 && s[0] == '0' {
          match s[1] {
          case 'b': base =  2; s = s[2..];
          case 'o': base =  8; s = s[2..];
          case 'd': base = 10; s = s[2..];
          case 'z': base = 12; s = s[2..];
          case 'x': base = 16; s = s[2..];
          }
      }

      value: u128;
      for r in s {
          if r == '_' {
              continue;
          }
          v := u128(_digit_value(r));
          if v >= base {
              break;
          }
          value *= base;
          value += v;
      }

      // An unsigned result is never negated; the previous always-false `neg`
      // local and its dead `-value` branch have been removed.
      return value;
  }
  // parse_int parses `s` with parse_i128 and converts the result to `int`.
  // The conversion is a plain cast; no range check is done here.
  parse_int :: proc(s: string) -> int {
      wide := parse_i128(s);
      return int(wide);
  }
  // parse_uint parses `s` with parse_u128 and converts the result to `uint`.
  // The conversion is a plain cast; no range check is done here.
  //
  // NOTE(review): `base` is accepted but never consulted - the base is
  // decided solely by the prefix handling inside parse_u128. Confirm with
  // callers whether it should be honoured or removed.
  parse_uint :: proc(s: string, base: int) -> uint {
      wide := parse_u128(s);
      return uint(wide);
  }
  // parse_f64 parses a decimal floating-point literal of the form
  //
  //     [+-] digits [ '.' digits ] [ ('e'|'E') [+-] digits ]
  //
  // '_' separators inside any digit run are skipped. Parsing stops silently
  // at the first unexpected character and the value accumulated so far is
  // returned; an empty string yields 0. The exponent is clamped to 308.
  //
  // Every read of s[i] is guarded by `i < len(s)`, so inputs that end right
  // after the integer digits ("123"), after the fraction ("1.5"), or after
  // the exponent marker ("1e") no longer index past the end of the string.
  parse_f64 :: proc(s: string) -> f64 {
      if len(s) == 0 {
          return 0;
      }

      i := 0;
      sign: f64 = 1;
      match s[i] {
      case '-': i++; sign = -1;
      case '+': i++;
      }

      // Integer part.
      value: f64 = 0;
      for ; i < len(s); i++ {
          r := rune(s[i]);
          if r == '_' {
              continue;
          }
          v := _digit_value(r);
          if v >= 10 {
              break;
          }
          value *= 10;
          value += f64(v);
      }

      // Fractional part.
      if i < len(s) && s[i] == '.' {
          pow10: f64 = 10;
          i++;
          for ; i < len(s); i++ {
              r := rune(s[i]);
              if r == '_' {
                  continue;
              }
              v := _digit_value(r);
              if v >= 10 {
                  break;
              }
              value += f64(v)/pow10;
              pow10 *= 10;
          }
      }

      // Exponent part. `frac` records a negative exponent, in which case the
      // value is divided by the scale instead of multiplied.
      frac := false;
      scale: f64 = 1;
      if i < len(s) && (s[i] == 'e' || s[i] == 'E') {
          i++;
          if i < len(s) {
              match s[i] {
              case '-': i++; frac = true;
              case '+': i++;
              }
          }

          exp: u32 = 0;
          for ; i < len(s); i++ {
              r := rune(s[i]);
              if r == '_' {
                  continue;
              }
              d := u32(_digit_value(r));
              if d >= 10 {
                  break;
              }
              exp = exp * 10 + d;
          }
          if exp > 308 { exp = 308; }

          // Build 10^exp in large steps first to keep the loop count small.
          for exp >= 50 { scale *= 1e50; exp -= 50; }
          for exp >=  8 { scale *= 1e8;  exp -=  8; }
          for exp >   0 { scale *= 10;   exp -=  1; }
      }

      return sign * (frac ? (value/scale) : (value*scale));
  }
  // append_bool appends the text "true" or "false" (according to `b`) to
  // `buf` and returns `buf` viewed as a string.
  append_bool :: proc(buf: []u8, b: bool) -> string {
      text := "false";
      if b {
          text = "true";
      }
      append(buf, ..[]u8(text));
      return string(buf);
  }
  // append_uint appends the textual form of `u` in the given `base` to `buf`
  // and returns `buf` viewed as a string. No prefix or sign flags are applied.
  //
  // The bit size handed to append_bits is derived from the parameter's own
  // type (u64) rather than the platform-sized `uint`, so the declared width
  // always matches the value being formatted.
  append_uint :: proc(buf: []u8, u: u64, base: int) -> string {
      return append_bits(buf, u128(u), base, false, 8*size_of(u64), digits, 0);
  }
  // append_int appends the textual form of the signed value `i` in the given
  // `base` to `buf` and returns `buf` viewed as a string. Negative values get
  // a leading '-'; no prefix or plus/space flags are applied.
  //
  // The bit size handed to append_bits is derived from the parameter's own
  // type (i64). Using the platform-sized `int` would make append_bits
  // reinterpret the value through a narrower signed type wherever `int` is
  // smaller than 64 bits, truncating large values.
  append_int :: proc(buf: []u8, i: i64, base: int) -> string {
      return append_bits(buf, u128(i), base, true, 8*size_of(i64), digits, 0);
  }
  // itoa appends the base-10 text of `i` to `buf` (via append_int) and
  // returns `buf` viewed as a string.
  itoa :: proc(buf: []u8, i: int) -> string {
      wide := i64(i);
      return append_int(buf, wide, 10);
  }
  // append_float formats `f` with generic_ftoa and returns the resulting
  // bytes viewed as a string. `fmt`, `prec` and `bit_size` are forwarded
  // unchanged; see generic_ftoa for their meaning.
  append_float :: proc(buf: []u8, f: f64, fmt: u8, prec, bit_size: int) -> string {
      formatted := generic_ftoa(buf, f, fmt, prec, bit_size);
      return string(formatted);
  }
  // DecimalSlice is the view of a decimal number that generic_ftoa hands to
  // format_digits.
  DecimalSlice :: struct {
      // Digit characters ('0'..'9'); only the first `count` are meaningful.
      digits: []u8,
      // Number of valid entries in `digits`.
      count: int,
      // Index in `digits` at which the decimal point sits; may be <= 0 or
      // greater than `count`.
      decimal_point: int,
      // NOTE(review): not set or read by the code in this section - the sign
      // is passed to format_digits as a separate argument.
      neg: bool,
  }
  // Float_Info describes the bit layout of a binary floating-point format,
  // as consumed by generic_ftoa and round_shortest.
  Float_Info :: struct {
      // Number of explicitly stored mantissa bits.
      mantbits: uint,
      // Number of exponent bits.
      expbits: uint,
      // Value added to the stored exponent to obtain the real exponent.
      bias: int,
  }
  // Layout tables for the supported float widths. generic_ftoa selects
  // _f32_info or _f64_info from its bit_size argument; _f16_info is not
  // referenced by the code in this section.
  _f16_info := Float_Info{mantbits = 10, expbits =  5, bias =   -15};
  _f32_info := Float_Info{mantbits = 23, expbits =  8, bias =  -127};
  _f64_info := Float_Info{mantbits = 52, expbits = 11, bias = -1023};
  // generic_ftoa appends the decimal text of `val` to `buf` and returns `buf`.
  //
  //   fmt      - format verb: 'e'/'E', 'f'/'F' or 'g'/'G' (see format_digits
  //              for which of these are actually rendered).
  //   prec     - number of digits requested; a negative value asks for the
  //              shortest representation (computed by round_shortest).
  //   bit_size - 32 or 64; `val` is first narrowed to f32 for 32. Any other
  //              value panics.
  //
  // Infinities and NaN are written as "+Inf", "-Inf" and "NaN".
  generic_ftoa :: proc(buf: []u8, val: f64, fmt: u8, prec, bit_size: int) -> []u8 {
      raw: u64;
      info: ^Float_Info;
      match bit_size {
      case 64:
          info = &_f64_info;
          raw = transmute(u64, val);
      case 32:
          info = &_f32_info;
          raw = u64(transmute(u32, f32(val)));
      case:
          panic("strconv: invalid bit_size");
      }

      // Split the raw bits into sign, stored exponent and stored mantissa.
      negative := raw>>(info.expbits+info.mantbits) != 0;
      exp := int(raw>>info.mantbits) & (1<<info.expbits - 1);
      mant := raw & (u64(1) << info.mantbits - 1);

      match exp {
      case 1<<info.expbits - 1:
          // All exponent bits set: infinity or NaN.
          text := "+Inf";
          if mant != 0 {
              text = "NaN";
          } else if negative {
              text = "-Inf";
          }
          append(buf, ..[]u8(text));
          return buf;
      case 0:
          // Denormalized: no implicit leading bit, exponent is one higher.
          exp++;
      case:
          // Normal number: restore the implicit leading mantissa bit.
          mant |= u64(1) << info.mantbits;
      }
      exp += info.bias;

      // Convert mant * 2^(exp - mantbits) into decimal digits.
      num_: Decimal;
      num := &num_;
      assign(num, mant);
      shift(num, exp - int(info.mantbits));

      // Round first; the digit slice is taken only after rounding is done.
      shortest := prec < 0;
      if shortest {
          round_shortest(num, mant, exp, info);
      } else {
          match fmt {
          case 'e', 'E':
              round(num, prec+1);
          case 'f', 'F':
              round(num, num.decimal_point+prec);
          case 'g', 'G':
              if prec == 0 {
                  prec = 1;
              }
              round(num, prec);
          }
      }

      digs := DecimalSlice{digits = num.digits[..], count = num.count, decimal_point = num.decimal_point};

      if shortest {
          // In shortest mode the precision is derived from the digits kept.
          match fmt {
          case 'e', 'E': prec = digs.count-1;
          case 'f', 'F': prec = max(digs.count-digs.decimal_point, 0);
          case 'g', 'G': prec = digs.count;
          }
      }

      return format_digits(buf, shortest, negative, digs, prec, fmt);
  }
  // format_digits renders the decimal digits in `digs` into `buf` according
  // to the format verb `fmt` and returns `buf`.
  //
  //   'f'/'F' - sign character ('-' or '+', always present), integer part,
  //             then '.' and exactly `prec` fractional digits when prec > 0.
  //   'e'/'E', 'g'/'G' - not implemented; these panic.
  //   anything else    - appends '%' followed by the verb itself.
  //
  // `shortest` is accepted but not used by the code below.
  format_digits :: proc(buf: []u8, shortest: bool, neg: bool, digs: DecimalSlice, prec: int, fmt: u8) -> []u8 {
      if fmt == 'f' || fmt == 'F' {
          if neg {
              append(buf, '-');
          } else {
              append(buf, '+');
          }

          // Integer part: the available digits, zero-padded up to the
          // decimal point; a lone '0' when the value has no integer digits.
          if digs.decimal_point > 0 {
              shown := min(digs.count, digs.decimal_point);
              append(buf, ..digs.digits[0..<shown]);
              for pad in shown..<digs.decimal_point {
                  append(buf, '0');
              }
          } else {
              append(buf, '0');
          }

          // Fractional part: positions outside the stored digits print '0'.
          if prec > 0 {
              append(buf, '.');
              first := digs.decimal_point;
              last := first + prec;
              for pos in first..<last {
                  if 0 <= pos && pos < digs.count {
                      append(buf, digs.digits[pos]);
                  } else {
                      append(buf, '0');
                  }
              }
          }
          return buf;
      } else if fmt == 'e' || fmt == 'E' {
          panic("strconv: e/E float printing is not yet supported");
          return buf; // TODO
      } else if fmt == 'g' || fmt == 'G' {
          panic("strconv: g/G float printing is not yet supported");
          return buf; // TODO
      }

      // Unknown verb: echo it back as "%<verb>".
      unknown: [2]u8;
      unknown[0] = '%';
      unknown[1] = fmt;
      append(buf, ..unknown[..]);
      return buf;
  }
  // round_shortest rounds `d` in place to the fewest digits that still
  // identify the floating-point number mant * 2^(exp - mantbits) uniquely.
  //
  //   d    - decimal expansion of the value; modified in place.
  //   mant - mantissa including the implicit leading bit (if any).
  //   exp  - unbiased exponent.
  //   flt  - layout of the float format the value came from.
  round_shortest :: proc(d: ^Decimal, mant: u64, exp: int, flt: ^Float_Info) {
      if mant == 0 { // If mantissa is zero, the number is zero
          d.count = 0;
          return;
      }

      /*
          The number is already shortest when
              10^(dp-nd) > 2^(exp-mantbits)
          i.e.
              log2(10) * (dp-nd) > exp-mantbits
          Since log2(10) > 3.32 it is sufficient that
              332*(dp-nd) >= 100*(exp-mantbits)
      */
      minexp := flt.bias+1; // minimum possible exponent
      if exp > minexp && 332*(d.decimal_point-d.count) >= 100*(exp - int(flt.mantbits)) {
          // Number is already its shortest
          return;
      }

      // d = mant << (exp - mantbits).
      // The next higher float is (mant+1) << (exp - mantbits); the upper
      // bound is halfway between the two: (2*mant + 1) << (exp - mantbits - 1).
      // (This used to be 2*mant - 1, which is the halfway point towards the
      // next LOWER float and made the upper bound coincide with the lower.)
      upper_: Decimal; upper: = &upper_;
      assign(upper, 2*mant + 1);
      shift(upper, exp - int(flt.mantbits) - 1);

      // The next lower float is (mant-1) << (exp - mantbits), unless mant-1
      // drops the leading bit and exp is not the minimum exponent, in which
      // case it is (2*mant - 1) << (exp - mantbits - 1).
      // Call it mantlo << (explo - mantbits); the lower bound is halfway
      // between: (2*mantlo + 1) << (explo - mantbits - 1).
      mantlo: u64;
      explo: int;
      if mant > 1<<flt.mantbits || exp == minexp {
          mantlo = mant-1;
          explo = exp;
      } else {
          mantlo = 2*mant - 1;
          explo = exp-1;
      }
      lower_: Decimal; lower: = &lower_;
      assign(lower, 2*mantlo + 1);
      shift(lower, explo - int(flt.mantbits) - 1);

      // The bounds themselves are acceptable outputs only when the mantissa
      // is even, because round-to-even would then map them back to `mant`.
      inclusive := mant%2 == 0;

      // Walk the digits until d has distinguished itself from both bounds.
      for i in 0..<d.count {
          l: u8 = '0'; // lower digit
          if i < lower.count {
              l = lower.digits[i];
          }
          m := d.digits[i]; // middle digit
          u: u8 = '0'; // upper digit
          if i < upper.count {
              u = upper.digits[i];
          }

          // Truncating is fine if lower already differs here, or if lower is
          // inclusive and this is its final digit.
          ok_round_down := l != m || inclusive && i+1 == lower.count;
          // Rounding up is fine if upper differs here and either upper is
          // inclusive or upper is strictly larger than the rounded-up value.
          ok_round_up := m != u && (inclusive || m+1 < u || i+1 < upper.count);

          if (ok_round_down && ok_round_up) {
              // Either direction works: round to nearest.
              round(d, i+1);
              return;
          }
          if (ok_round_down) {
              round_down(d, i+1);
              return;
          }
          if (ok_round_up) {
              round_up(d, i+1);
              return;
          }
      }
  }
  // Largest base accepted by append_bits.
  MAX_BASE :: 32;

  // Digit characters indexed by digit value; used as the default digit
  // table by append_uint and append_int. It holds 36 characters, which is
  // more than MAX_BASE requires.
  immutable digits := "0123456789abcdefghijklmnopqrstuvwxyz";
  // is_integer_negative interprets the low `bit_size` bits of `u` as an
  // integer and returns its magnitude together with a flag telling whether
  // it was negative.
  //
  //   u         - raw value bits.
  //   is_signed - when false, `u` is returned unchanged and neg is false.
  //   bit_size  - width of the signed type: 8, 16, 32, 64 or 128. Any other
  //               value panics (signed case only).
  //
  // The value is sign-extended to i128 BEFORE it is negated. Negating in the
  // narrow type overflowed for the minimum value (e.g. i8 -128 stayed -128)
  // and the following conversion to u128 then produced a huge number instead
  // of the magnitude 128.
  is_integer_negative :: proc(u: u128, is_signed: bool, bit_size: int) -> (unsigned: u128, neg: bool) {
      if !is_signed {
          return u, false;
      }

      wide: i128;
      match bit_size {
      case 8:   wide = i128(i8(u));
      case 16:  wide = i128(i16(u));
      case 32:  wide = i128(i32(u));
      case 64:  wide = i128(i64(u));
      case 128: wide = i128(u);
      case:
          panic("is_integer_negative: Unknown integer size");
      }

      if wide < 0 {
          // For the i128 minimum the negation wraps back onto itself, and the
          // conversion to u128 yields the correct magnitude 2^127.
          return u128(-wide), true;
      }
      return u128(wide), false;
  }
  // append_bits appends the textual form of an integer to `buf` and returns
  // `buf` viewed as a string.
  //
  //   u_        - raw value bits.
  //   base      - output base, 2..MAX_BASE; anything else panics.
  //   is_signed - whether the value is to be read as signed.
  //   bit_size  - width of the signed type (see is_integer_negative).
  //   digits    - digit characters indexed by digit value; must hold at
  //               least `base` characters.
  //   flags     - IntFlag bits: Prefix adds "0b"/"0o"/"0d"/"0z"/"0x" for
  //               bases 2/8/10/12/16; Plus and Space add '+' or ' ' in front
  //               of non-negative values (Plus wins when both are set).
  append_bits :: proc(buf: []u8, u_: u128, base: int, is_signed: bool, bit_size: int, digits: string, flags: IntFlag) -> string {
      if base < 2 || base > MAX_BASE {
          panic("strconv: illegal base passed to append_bits");
      }

      // Scratch buffer, filled from the back. Worst case is a 128-bit value
      // in base 2: 128 digits + 2 prefix bytes + 1 sign/plus/space byte = 131.
      // The previous size of 129 left no room for the prefix, so `i` could
      // run below zero.
      a: [131]u8;
      i := len(a);

      u, neg := is_integer_negative(u_, is_signed, bit_size);
      b := u128(base);

      // Emit digits least-significant first; the last digit is written after
      // the loop so that zero still produces a single "0".
      for u >= b {
          i--; a[i] = digits[uint(u % b)];
          u /= b;
      }
      i--; a[i] = digits[uint(u % b)];

      if flags&IntFlag.Prefix != 0 {
          ok := true;
          match base {
          case 2:  i--; a[i] = 'b';
          case 8:  i--; a[i] = 'o';
          case 10: i--; a[i] = 'd';
          case 12: i--; a[i] = 'z';
          case 16: i--; a[i] = 'x';
          case: ok = false; // no prefix letter defined for this base
          }
          if ok {
              i--; a[i] = '0';
          }
      }

      if neg {
          i--; a[i] = '-';
      } else if flags&IntFlag.Plus != 0 {
          i--; a[i] = '+';
      } else if flags&IntFlag.Space != 0 {
          i--; a[i] = ' ';
      }

      append(buf, ..a[i..]);
      return string(buf);
  }