marshal.odin 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670
  1. package encoding_json
  2. import "core:mem"
  3. import "core:math/bits"
  4. import "base:runtime"
  5. import "core:strconv"
  6. import "core:strings"
  7. import "core:reflect"
  8. import "core:io"
  9. import "core:slice"
  // Errors raised by the marshaller itself (as opposed to errors reported by
  // the writer it is emitting to).
  Marshal_Data_Error :: enum {
      // No error occurred. Must stay the zero value.
      None             = 0,
      // The value (or something nested inside it) has a type that this
      // marshaller does not know how to encode.
      Unsupported_Type = 1,
  }
  // Error type returned by the marshalling procedures in this file.
  //
  // It is either a `Marshal_Data_Error` produced by the marshaller or an
  // `io.Error` propagated from the destination writer. The union is declared
  // `#shared_nil`, so the zero value of either variant compares equal to `nil`.
  Marshal_Error :: union #shared_nil {
      Marshal_Data_Error,
      io.Error,
  }
  // Options controlling how values are marshalled.
  //
  // NOTE: Be careful with MJSON output when keys are written without quotes:
  // keys that contain whitespace will produce bad output.
  Marshal_Options :: struct {
      // Which specification the output follows.
      spec: Specification,

      // Emit line breaks and indentation (tabs or spaces).
      pretty: bool,

      // Indent with spaces rather than tabs.
      use_spaces: bool,

      // Number of spaces per indentation level when `use_spaces` is true.
      // A value of 0 means 4 spaces.
      spaces: int,

      // Write unsigned integers as hexadecimal when the spec is JSON5 or MJSON.
      write_uint_as_hex: bool,

      // When the spec is MJSON and this is true, keys are written quoted.
      //
      // WARNING: If this is false and your keys contain whitespace, the
      // output will be bad.
      mjson_keys_use_quotes: bool,

      // When the spec is MJSON and this is true, '=' separates keys from
      // values; otherwise ':' is used.
      mjson_keys_use_equal_sign: bool,

      // Output map entries sorted by key.
      //
      // NOTE: This temp-allocates and sorts a list for every map written.
      sort_maps_by_key: bool,

      // Write an enum value's name rather than its underlying value.
      //
      // NOTE: When no name is found for the value, the underlying value is
      // written instead.
      use_enum_names: bool,

      // Internal state; maintained by the marshaller while it writes.
      indentation: int,
      mjson_skipped_first_braces_start: bool,
      mjson_skipped_first_braces_end: bool,
  }
  // Marshals `v` according to `opt` and returns the encoded bytes.
  //
  // The output buffer is created with `allocator`. On error the buffer is
  // destroyed and `data` is nil. When nothing at all was written, `data` is
  // also nil.
  marshal :: proc(v: any, opt: Marshal_Options = {}, allocator := context.allocator, loc := #caller_location) -> (data: []byte, err: Marshal_Error) {
      builder := strings.builder_make(allocator, loc)
      // Only release the buffer on failure; on success it is handed to the caller.
      defer if err != nil {
          strings.builder_destroy(&builder)
      }

      // Sorting map keys uses temp allocations, so guard the temp allocator
      // unless the result itself is being built in it.
      runtime.DEFAULT_TEMP_ALLOCATOR_TEMP_GUARD(ignore = allocator == context.temp_allocator)

      // Work on a private copy: the marshaller mutates its options as it goes.
      options := opt
      marshal_to_builder(&builder, v, &options) or_return

      if len(builder.buf) == 0 {
          return nil, nil
      }
      return builder.buf[:], nil
  }
  // Marshals `v` into the string builder `b` by wrapping it in a writer and
  // delegating to `marshal_to_writer`.
  marshal_to_builder :: proc(b: ^strings.Builder, v: any, opt: ^Marshal_Options) -> Marshal_Error {
      writer := strings.to_writer(b)
      return marshal_to_writer(writer, v, opt)
  }
  // Writes the encoding of `v` to `w`, formatted according to `opt`.
  //
  // `opt` is mutated while writing (indentation level and the MJSON
  // "skipped outer braces" flags).
  //
  // Encoding rules, by base type of `v`:
  //   - nil `any`, nil unions                  -> `null`
  //   - integers                               -> decimal, or `0x…` hex for unsigned
  //                                               integers when `opt.write_uint_as_hex`
  //                                               is set and the spec is JSON5 or MJSON
  //   - runes, strings, cstrings               -> quoted, escaped string
  //   - f16/f32/f64                            -> number
  //   - complex numbers                        -> `[real, imag]`
  //   - booleans                               -> `true` / `false`
  //   - arrays, enumerated arrays, dynamic
  //     arrays, slices                         -> `[ ... ]`
  //   - maps with string or integer keys       -> `{ ... }`
  //   - structs                                -> `{ ... }`, honouring the `json` struct tag
  //                                               (`-` skips a field, `omitempty` skips
  //                                               empty values, `using _: T` is flattened)
  //   - unions                                 -> the active variant
  //   - enums                                  -> underlying value, or the name when
  //                                               `opt.use_enum_names` is set and a name exists
  //   - bit_sets                               -> the underlying bits as an unsigned integer
  //
  // Returns `.Unsupported_Type` for every other type, or the first `io.Error`
  // reported by `w`. Output written before an error is not rolled back.
  marshal_to_writer :: proc(w: io.Writer, v: any, opt: ^Marshal_Options) -> (err: Marshal_Error) {
      // Writes `count` consecutive elements starting at `base` as a bracketed list.
      marshal_sequence :: proc(w: io.Writer, opt: ^Marshal_Options, base: rawptr, count: int, elem: ^runtime.Type_Info, elem_size: int) -> (err: Marshal_Error) {
          opt_write_start(w, opt, '[') or_return
          for i in 0..<count {
              opt_write_iteration(w, opt, i == 0) or_return
              elem_ptr := uintptr(base) + uintptr(i*elem_size)
              marshal_to_writer(w, any{rawptr(elem_ptr), elem.id}, opt) or_return
          }
          opt_write_end(w, opt, ']') or_return
          return
      }

      if v == nil {
          io.write_string(w, "null") or_return
          return
      }

      ti := runtime.type_info_base(type_info_of(v.id))
      a := any{v.data, ti.id}

      switch info in ti.variant {
      case runtime.Type_Info_Named:
          // `type_info_base` strips named types, so this cannot be reached.
          unreachable()

      case runtime.Type_Info_Integer:
          buf: [40]byte
          u := cast_any_int_to_u128(a)

          // Hex applies to every unsigned integer type (including `uint`,
          // `uintptr` and the endian-specific ones), not just u8..u128.
          as_hex := opt.write_uint_as_hex && !info.signed && (opt.spec == .JSON5 || opt.spec == .MJSON)

          s: string
          if as_hex {
              s = strconv.append_bits_128(buf[:], u, 16, info.signed, 8*ti.size, "0123456789abcdef", { .Prefix })
          } else {
              s = strconv.append_bits_128(buf[:], u, 10, info.signed, 8*ti.size, "0123456789", nil)
          }
          io.write_string(w, s) or_return

      case runtime.Type_Info_Rune:
          r := a.(rune)
          io.write_byte(w, '"') or_return
          io.write_escaped_rune(w, r, '"', true) or_return
          io.write_byte(w, '"') or_return

      case runtime.Type_Info_Float:
          switch f in a {
          case f16: io.write_f16(w, f) or_return
          case f32: io.write_f32(w, f) or_return
          case f64: io.write_f64(w, f) or_return
          case: return .Unsupported_Type
          }

      case runtime.Type_Info_Complex:
          r, i: f64
          switch z in a {
          case complex32:  r, i = f64(real(z)), f64(imag(z))
          case complex64:  r, i = f64(real(z)), f64(imag(z))
          case complex128: r, i = f64(real(z)), f64(imag(z))
          case: return .Unsupported_Type
          }

          io.write_byte(w, '[') or_return
          io.write_f64(w, r) or_return
          io.write_string(w, ", ") or_return
          io.write_f64(w, i) or_return
          io.write_byte(w, ']') or_return

      case runtime.Type_Info_Quaternion:
          return .Unsupported_Type

      case runtime.Type_Info_String:
          switch s in a {
          case string:  io.write_quoted_string(w, s, '"', nil, true) or_return
          case cstring: io.write_quoted_string(w, string(s), '"', nil, true) or_return
          }

      case runtime.Type_Info_Boolean:
          val: bool
          switch b in a {
          case bool: val = bool(b)
          case b8:   val = bool(b)
          case b16:  val = bool(b)
          case b32:  val = bool(b)
          case b64:  val = bool(b)
          }
          io.write_string(w, val ? "true" : "false") or_return

      case runtime.Type_Info_Any:
          return .Unsupported_Type

      case runtime.Type_Info_Type_Id:
          return .Unsupported_Type

      case runtime.Type_Info_Pointer:
          return .Unsupported_Type

      case runtime.Type_Info_Multi_Pointer:
          return .Unsupported_Type

      case runtime.Type_Info_Soa_Pointer:
          return .Unsupported_Type

      case runtime.Type_Info_Procedure:
          return .Unsupported_Type

      case runtime.Type_Info_Parameters:
          return .Unsupported_Type

      case runtime.Type_Info_Simd_Vector:
          return .Unsupported_Type

      case runtime.Type_Info_Matrix:
          return .Unsupported_Type

      case runtime.Type_Info_Bit_Field:
          return .Unsupported_Type

      case runtime.Type_Info_Array:
          marshal_sequence(w, opt, v.data, info.count, info.elem, info.elem_size) or_return

      case runtime.Type_Info_Enumerated_Array:
          marshal_sequence(w, opt, v.data, info.count, info.elem, info.elem_size) or_return

      case runtime.Type_Info_Dynamic_Array:
          raw := (^mem.Raw_Dynamic_Array)(v.data)
          marshal_sequence(w, opt, raw.data, raw.len, info.elem, info.elem_size) or_return

      case runtime.Type_Info_Slice:
          raw := (^mem.Raw_Slice)(v.data)
          marshal_sequence(w, opt, raw.data, raw.len, info.elem, info.elem_size) or_return

      case runtime.Type_Info_Map:
          // Produces the object-key text for one map key.
          //
          // String and cstring keys are returned as-is. Integer keys are
          // formatted as decimal into `buf`; `uses_buf` is then true and the
          // returned string is only valid while `buf` is. `ok` is false for
          // any other key type.
          map_key_name :: proc(key: rawptr, key_info: ^runtime.Type_Info, buf: []byte) -> (name: string, uses_buf: bool, ok: bool) {
              kti := runtime.type_info_base(key_info)
              ka := any{key, kti.id}
              #partial switch kinfo in kti.variant {
              case runtime.Type_Info_String:
                  switch s in ka {
                  case string:  name = s
                  case cstring: name = string(s)
                  }
                  return name, false, true

              case runtime.Type_Info_Integer:
                  u := cast_any_int_to_u128(ka)
                  name = strconv.append_bits_128(buf, u, 10, kinfo.signed, 8*kti.size, "0123456789", nil)
                  return name, true, true
              }
              return "", false, false
          }

          m := (^mem.Raw_Map)(v.data)
          opt_write_start(w, opt, '{') or_return

          if m != nil {
              if info.map_info == nil {
                  return .Unsupported_Type
              }
              map_cap := uintptr(runtime.map_cap(m^))
              ks, vs, hs, _, _ := runtime.map_kvh_data_dynamic(m^, info.map_info)

              if !opt.sort_maps_by_key {
                  i := 0
                  for bucket_index in 0..<map_cap {
                      runtime.map_hash_is_valid(hs[bucket_index]) or_continue

                      opt_write_iteration(w, opt, i == 0) or_return
                      i += 1

                      key   := rawptr(runtime.map_cell_index_dynamic(ks, info.map_info.ks, bucket_index))
                      value := rawptr(runtime.map_cell_index_dynamic(vs, info.map_info.vs, bucket_index))

                      buf: [40]byte
                      name, _, ok := map_key_name(key, info.key, buf[:])
                      if !ok {
                          return .Unsupported_Type
                      }
                      opt_write_key(w, opt, name) or_return

                      marshal_to_writer(w, any{value, info.value.id}, opt) or_return
                  }
              } else {
                  Entry :: struct {
                      key: string,
                      value: any,
                  }

                  // If we are sorting the map by key, then we temp alloc an array
                  // and sort it, then output the result. Keys are compared as
                  // their output text.
                  sorted := make([dynamic]Entry, 0, map_cap, context.temp_allocator)
                  for bucket_index in 0..<map_cap {
                      runtime.map_hash_is_valid(hs[bucket_index]) or_continue

                      key   := rawptr(runtime.map_cell_index_dynamic(ks, info.map_info.ks, bucket_index))
                      value := rawptr(runtime.map_cell_index_dynamic(vs, info.map_info.vs, bucket_index))

                      buf: [40]byte
                      name, uses_buf, ok := map_key_name(key, info.key, buf[:])
                      if !ok {
                          return .Unsupported_Type
                      }
                      if uses_buf {
                          // `buf` is per-iteration stack storage; the entry has
                          // to outlive this loop, so copy the text.
                          name = strings.clone(name, context.temp_allocator)
                      }

                      append(&sorted, Entry { key = name, value = any{value, info.value.id}})
                  }

                  slice.sort_by(sorted[:], proc(i, j: Entry) -> bool { return i.key < j.key })

                  for s, i in sorted {
                      opt_write_iteration(w, opt, i == 0) or_return
                      opt_write_key(w, opt, s.key) or_return
                      marshal_to_writer(w, s.value, opt) or_return
                  }
              }
          }

          opt_write_end(w, opt, '}') or_return

      case runtime.Type_Info_Struct:
          // Reports whether `v` counts as empty for the `omitempty` tag flag.
          is_omitempty :: proc(v: any) -> bool {
              v := v
              if v == nil {
                  return true
              }
              ti := runtime.type_info_core(type_info_of(v.id))
              #partial switch info in ti.variant {
              case runtime.Type_Info_String:
                  switch x in v {
                  case string:
                      return x == ""
                  case cstring:
                      return x == nil || x == ""
                  }
              case runtime.Type_Info_Any:
                  return v.(any) == nil
              case runtime.Type_Info_Type_Id:
                  return v.(typeid) == nil
              case runtime.Type_Info_Pointer,
                   runtime.Type_Info_Multi_Pointer,
                   runtime.Type_Info_Procedure:
                  return (^rawptr)(v.data)^ == nil
              case runtime.Type_Info_Dynamic_Array:
                  return (^runtime.Raw_Dynamic_Array)(v.data).len == 0
              case runtime.Type_Info_Slice:
                  return (^runtime.Raw_Slice)(v.data).len == 0
              case runtime.Type_Info_Union,
                   runtime.Type_Info_Bit_Set,
                   runtime.Type_Info_Soa_Pointer:
                  return reflect.is_nil(v)
              case runtime.Type_Info_Map:
                  return (^runtime.Raw_Map)(v.data).len == 0
              }
              return false
          }

          // Writes the fields of struct `v` as `key: value` entries, without
          // the surrounding braces.
          //
          // `first_iteration` is shared with the recursion into `using _: T`
          // fields, so that a separator is written exactly once between any
          // two emitted entries, however the entries are nested.
          marshal_struct_fields :: proc(w: io.Writer, v: any, opt: ^Marshal_Options, first_iteration: ^bool) -> (err: Marshal_Error) {
              ti := runtime.type_info_base(type_info_of(v.id))
              info := ti.variant.(runtime.Type_Info_Struct)
              for name, i in info.names[:info.field_count] {
                  omitempty := false

                  json_name, extra := json_name_from_tag_value(reflect.struct_tag_get(reflect.Struct_Tag(info.tags[i]), "json"))

                  if json_name == "-" {
                      continue
                  }

                  for flag in strings.split_iterator(&extra, ",") {
                      switch flag {
                      case "omitempty":
                          omitempty = true
                      }
                  }

                  id := info.types[i].id
                  data := rawptr(uintptr(v.data) + info.offsets[i])
                  the_value := any{data, id}

                  if omitempty && is_omitempty(the_value) {
                      continue
                  }

                  // Marshal the fields of 'using _: T' fields directly into the
                  // parent struct. No separator is written here: the embedded
                  // fields write their own, and an embedded struct that emits
                  // nothing must not leave a dangling comma behind.
                  if json_name == "" && info.usings[i] && name == "_" {
                      marshal_struct_fields(w, the_value, opt, first_iteration) or_return
                      continue
                  }

                  opt_write_iteration(w, opt, first_iteration^) or_return
                  first_iteration^ = false

                  opt_write_key(w, opt, json_name if json_name != "" else name) or_return
                  marshal_to_writer(w, the_value, opt) or_return
              }
              return
          }

          opt_write_start(w, opt, '{') or_return
          first_iteration := true
          marshal_struct_fields(w, v, opt, &first_iteration) or_return
          opt_write_end(w, opt, '}') or_return

      case runtime.Type_Info_Union:
          if len(info.variants) == 0 || v.data == nil {
              io.write_string(w, "null") or_return
              return nil
          }

          tag_ptr := uintptr(v.data) + info.tag_offset
          tag_any := any{rawptr(tag_ptr), info.tag_type.id}

          tag: i64 = -1
          switch i in tag_any {
          case u8:  tag = i64(i)
          case i8:  tag = i64(i)
          case u16: tag = i64(i)
          case i16: tag = i64(i)
          case u32: tag = i64(i)
          case i32: tag = i64(i)
          case u64: tag = i64(i)
          case i64: tag = i64(i)
          case: panic("Invalid union tag type")
          }

          // Unless the union is `#no_nil`, tag 0 means "no variant" and the
          // variants are numbered from 1.
          if !info.no_nil {
              if tag == 0 {
                  io.write_string(w, "null") or_return
                  return nil
              }
              tag -= 1
          }
          id := info.variants[tag].id
          return marshal_to_writer(w, any{v.data, id}, opt)

      case runtime.Type_Info_Enum:
          if !opt.use_enum_names || len(info.names) == 0 {
              return marshal_to_writer(w, any{v.data, info.base.id}, opt)
          } else {
              name, found := reflect.enum_name_from_value_any(v)
              if found {
                  return marshal_to_writer(w, name, opt)
              } else {
                  return marshal_to_writer(w, any{v.data, info.base.id}, opt)
              }
          }

      case runtime.Type_Info_Bit_Set:
          // Reports whether the bit_set's underlying integer type has an
          // explicit endianness that differs from the target platform's.
          is_bit_set_different_endian_to_platform :: proc(ti: ^runtime.Type_Info) -> bool {
              if ti == nil {
                  return false
              }
              t := runtime.type_info_base(ti)
              #partial switch info in t.variant {
              case runtime.Type_Info_Integer:
                  switch info.endianness {
                  case .Platform: return false
                  case .Little:   return ODIN_ENDIAN != .Little
                  case .Big:      return ODIN_ENDIAN != .Big
                  }
              }
              return false
          }

          bit_data: u64
          bit_size := u64(8*ti.size)

          do_byte_swap := is_bit_set_different_endian_to_platform(info.underlying)

          switch bit_size {
          case 0: bit_data = 0
          case 8:
              x := (^u8)(v.data)^
              bit_data = u64(x)
          case 16:
              x := (^u16)(v.data)^
              if do_byte_swap {
                  x = bits.byte_swap(x)
              }
              bit_data = u64(x)
          case 32:
              x := (^u32)(v.data)^
              if do_byte_swap {
                  x = bits.byte_swap(x)
              }
              bit_data = u64(x)
          case 64:
              x := (^u64)(v.data)^
              if do_byte_swap {
                  x = bits.byte_swap(x)
              }
              bit_data = u64(x)
          case: panic("unknown bit_size size")
          }
          io.write_u64(w, bit_data) or_return
      }

      return
  }
  // Writes an object key followed by the key/value delimiter.
  //
  // JSON and JSON5 keys are always quoted and followed by ':'. MJSON keys are
  // quoted only when `opt.mjson_keys_use_quotes` is set, and are followed by
  // '=' when `opt.mjson_keys_use_equal_sign` is set (otherwise ':'). In pretty
  // mode the delimiter is padded with spaces.
  opt_write_key :: proc(w: io.Writer, opt: ^Marshal_Options, name: string) -> (err: io.Error) {
      switch opt.spec {
      case .JSON, .JSON5:
          io.write_quoted_string(w, name) or_return
          io.write_string(w, ": " if opt.pretty else ":") or_return

      case .MJSON:
          if opt.mjson_keys_use_quotes {
              io.write_quoted_string(w, name) or_return
          } else {
              io.write_string(w, name) or_return
          }

          delimiter: string
          if opt.mjson_keys_use_equal_sign {
              delimiter = " = " if opt.pretty else "="
          } else {
              delimiter = ": " if opt.pretty else ":"
          }
          io.write_string(w, delimiter) or_return
      }

      return
  }
  // Writes the opening byte `c` of an object or array and goes one
  // indentation level deeper; in pretty mode a newline follows.
  //
  // For MJSON the outermost '{' is omitted (once). This is only ever done for
  // '{': skipping a starting '[' is not allowed.
  opt_write_start :: proc(w: io.Writer, opt: ^Marshal_Options, c: byte) -> (err: io.Error) {
      at_top_level := opt.indentation == 0
      skip_brace := opt.spec == .MJSON && c == '{' && at_top_level && !opt.mjson_skipped_first_braces_start
      if skip_brace {
          opt.mjson_skipped_first_braces_start = true
          return
      }

      io.write_byte(w, c) or_return
      opt.indentation += 1

      if opt.pretty {
          io.write_byte(w, '\n') or_return
      }

      return
  }
  // Writes whatever has to precede the next element of an object or array:
  // the separator from the previous element (unless this is the first one),
  // then the current indentation.
  opt_write_iteration :: proc(w: io.Writer, opt: ^Marshal_Options, first_iteration: bool) -> (err: io.Error) {
      needs_separator := !first_iteration

      switch opt.spec {
      case .JSON, .JSON5:
          if needs_separator {
              io.write_byte(w, ',') or_return

              if opt.pretty {
                  io.write_byte(w, '\n') or_return
              }
          }

          opt_write_indentation(w, opt) or_return

      case .MJSON:
          if needs_separator {
              // Pretty output separates entries by newline alone; compact
              // output still needs the comma.
              separator: byte = '\n' if opt.pretty else ','
              io.write_byte(w, separator) or_return
          }

          opt_write_indentation(w, opt) or_return
      }

      return
  }
  // Closes an object or array: goes one indentation level up, writes a
  // newline plus indentation in pretty mode, then writes the closing byte `c`.
  //
  // For MJSON, the '}' matching a previously skipped outermost '{' is omitted
  // as well (once).
  opt_write_end :: proc(w: io.Writer, opt: ^Marshal_Options, c: byte) -> (err: io.Error) {
      outer_brace_pending := opt.mjson_skipped_first_braces_start && !opt.mjson_skipped_first_braces_end
      skip_brace := opt.spec == .MJSON && outer_brace_pending && opt.indentation == 0 && c == '}'
      if skip_brace {
          opt.mjson_skipped_first_braces_end = true
          return
      }

      opt.indentation -= 1

      if opt.pretty {
          io.write_byte(w, '\n') or_return
          opt_write_indentation(w, opt) or_return
      }

      io.write_byte(w, c) or_return

      return
  }
  // Writes the indentation for the current nesting level. Does nothing unless
  // `opt.pretty` is set.
  //
  // One tab is written per level, or `opt.spaces` spaces per level (4 when
  // `opt.spaces` is 0) if `opt.use_spaces` is set.
  opt_write_indentation :: proc(w: io.Writer, opt: ^Marshal_Options) -> (err: io.Error) {
      if !opt.pretty {
          return
      }

      fill: byte = '\t'
      count := opt.indentation

      if opt.use_spaces {
          per_level := 4 if opt.spaces == 0 else opt.spaces
          fill = ' '
          count = opt.indentation * per_level
      }

      for _ in 0..<count {
          io.write_byte(w, fill) or_return
      }

      return
  }
  // Reads the integer stored in `any_int_value` and converts it to `u128`.
  //
  // Every built-in integer type is handled: platform-endian, little-endian
  // and big-endian, including `i128le` and `i128be`. Endian-specific values
  // are converted to their native value, and signed values are converted
  // with a regular `u128(...)` cast.
  //
  // Returns 0 when `any_int_value` does not hold one of these exact types
  // (for example a named/distinct integer type whose id was not reduced to
  // its base type first).
  @(private)
  cast_any_int_to_u128 :: proc(any_int_value: any) -> u128 {
      u: u128 = 0
      switch i in any_int_value {
      case i8:      u = u128(i)
      case i16:     u = u128(i)
      case i32:     u = u128(i)
      case i64:     u = u128(i)
      case i128:    u = u128(i)
      case int:     u = u128(i)
      case u8:      u = u128(i)
      case u16:     u = u128(i)
      case u32:     u = u128(i)
      case u64:     u = u128(i)
      case u128:    u = u128(i)
      case uint:    u = u128(i)
      case uintptr: u = u128(i)

      case i16le:   u = u128(i)
      case i32le:   u = u128(i)
      case i64le:   u = u128(i)
      case i128le:  u = u128(i)
      case u16le:   u = u128(i)
      case u32le:   u = u128(i)
      case u64le:   u = u128(i)
      case u128le:  u = u128(i)

      case i16be:   u = u128(i)
      case i32be:   u = u128(i)
      case i64be:   u = u128(i)
      case i128be:  u = u128(i)
      case u16be:   u = u128(i)
      case u32be:   u = u128(i)
      case u64be:   u = u128(i)
      case u128be:  u = u128(i)
      }

      return u
  }