json.cpp 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563
  1. /*************************************************************************/
  2. /* json.cpp */
  3. /*************************************************************************/
  4. /* This file is part of: */
  5. /* GODOT ENGINE */
  6. /* https://godotengine.org */
  7. /*************************************************************************/
  8. /* Copyright (c) 2007-2021 Juan Linietsky, Ariel Manzur. */
  9. /* Copyright (c) 2014-2021 Godot Engine contributors (cf. AUTHORS.md). */
  10. /* */
  11. /* Permission is hereby granted, free of charge, to any person obtaining */
  12. /* a copy of this software and associated documentation files (the */
  13. /* "Software"), to deal in the Software without restriction, including */
  14. /* without limitation the rights to use, copy, modify, merge, publish, */
  15. /* distribute, sublicense, and/or sell copies of the Software, and to */
  16. /* permit persons to whom the Software is furnished to do so, subject to */
  17. /* the following conditions: */
  18. /* */
  19. /* The above copyright notice and this permission notice shall be */
  20. /* included in all copies or substantial portions of the Software. */
  21. /* */
  22. /* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, */
  23. /* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF */
  24. /* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.*/
  25. /* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY */
  26. /* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, */
  27. /* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE */
  28. /* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. */
  29. /*************************************************************************/
  30. #include "json.h"
  31. #include "core/string/print_string.h"
  32. const char *JSON::tk_name[TK_MAX] = {
  33. "'{'",
  34. "'}'",
  35. "'['",
  36. "']'",
  37. "identifier",
  38. "string",
  39. "number",
  40. "':'",
  41. "','",
  42. "EOF",
  43. };
  44. static String _make_indent(const String &p_indent, int p_size) {
  45. String indent_text = "";
  46. if (!p_indent.is_empty()) {
  47. for (int i = 0; i < p_size; i++) {
  48. indent_text += p_indent;
  49. }
  50. }
  51. return indent_text;
  52. }
  53. String JSON::_print_var(const Variant &p_var, const String &p_indent, int p_cur_indent, bool p_sort_keys, Set<const void *> &p_markers, bool p_full_precision) {
  54. String colon = ":";
  55. String end_statement = "";
  56. if (!p_indent.is_empty()) {
  57. colon += " ";
  58. end_statement += "\n";
  59. }
  60. switch (p_var.get_type()) {
  61. case Variant::NIL:
  62. return "null";
  63. case Variant::BOOL:
  64. return p_var.operator bool() ? "true" : "false";
  65. case Variant::INT:
  66. return itos(p_var);
  67. case Variant::FLOAT: {
  68. double num = p_var;
  69. if (p_full_precision) {
  70. // Store unreliable digits (17) instead of just reliable
  71. // digits (14) so that the value can be decoded exactly.
  72. return String::num(num, 17 - (int)floor(log10(num)));
  73. } else {
  74. // Store only reliable digits (14) by default.
  75. return String::num(num, 14 - (int)floor(log10(num)));
  76. }
  77. }
  78. case Variant::PACKED_INT32_ARRAY:
  79. case Variant::PACKED_INT64_ARRAY:
  80. case Variant::PACKED_FLOAT32_ARRAY:
  81. case Variant::PACKED_FLOAT64_ARRAY:
  82. case Variant::PACKED_STRING_ARRAY:
  83. case Variant::ARRAY: {
  84. String s = "[";
  85. s += end_statement;
  86. Array a = p_var;
  87. ERR_FAIL_COND_V_MSG(p_markers.has(a.id()), "\"[...]\"", "Converting circular structure to JSON.");
  88. p_markers.insert(a.id());
  89. for (int i = 0; i < a.size(); i++) {
  90. if (i > 0) {
  91. s += ",";
  92. s += end_statement;
  93. }
  94. s += _make_indent(p_indent, p_cur_indent + 1) + _print_var(a[i], p_indent, p_cur_indent + 1, p_sort_keys, p_markers);
  95. }
  96. s += end_statement + _make_indent(p_indent, p_cur_indent) + "]";
  97. p_markers.erase(a.id());
  98. return s;
  99. }
  100. case Variant::DICTIONARY: {
  101. String s = "{";
  102. s += end_statement;
  103. Dictionary d = p_var;
  104. ERR_FAIL_COND_V_MSG(p_markers.has(d.id()), "\"{...}\"", "Converting circular structure to JSON.");
  105. p_markers.insert(d.id());
  106. List<Variant> keys;
  107. d.get_key_list(&keys);
  108. if (p_sort_keys) {
  109. keys.sort();
  110. }
  111. for (List<Variant>::Element *E = keys.front(); E; E = E->next()) {
  112. if (E != keys.front()) {
  113. s += ",";
  114. s += end_statement;
  115. }
  116. s += _make_indent(p_indent, p_cur_indent + 1) + _print_var(String(E->get()), p_indent, p_cur_indent + 1, p_sort_keys, p_markers);
  117. s += colon;
  118. s += _print_var(d[E->get()], p_indent, p_cur_indent + 1, p_sort_keys, p_markers);
  119. }
  120. s += end_statement + _make_indent(p_indent, p_cur_indent) + "}";
  121. p_markers.erase(d.id());
  122. return s;
  123. }
  124. default:
  125. return "\"" + String(p_var).json_escape() + "\"";
  126. }
  127. }
  128. String JSON::print(const Variant &p_var, const String &p_indent, bool p_sort_keys, bool p_full_precision) {
  129. Set<const void *> markers;
  130. return _print_var(p_var, p_indent, 0, p_sort_keys, markers, p_full_precision);
  131. }
  132. Error JSON::_get_token(const char32_t *p_str, int &index, int p_len, Token &r_token, int &line, String &r_err_str) {
  133. while (p_len > 0) {
  134. switch (p_str[index]) {
  135. case '\n': {
  136. line++;
  137. index++;
  138. break;
  139. }
  140. case 0: {
  141. r_token.type = TK_EOF;
  142. return OK;
  143. } break;
  144. case '{': {
  145. r_token.type = TK_CURLY_BRACKET_OPEN;
  146. index++;
  147. return OK;
  148. }
  149. case '}': {
  150. r_token.type = TK_CURLY_BRACKET_CLOSE;
  151. index++;
  152. return OK;
  153. }
  154. case '[': {
  155. r_token.type = TK_BRACKET_OPEN;
  156. index++;
  157. return OK;
  158. }
  159. case ']': {
  160. r_token.type = TK_BRACKET_CLOSE;
  161. index++;
  162. return OK;
  163. }
  164. case ':': {
  165. r_token.type = TK_COLON;
  166. index++;
  167. return OK;
  168. }
  169. case ',': {
  170. r_token.type = TK_COMMA;
  171. index++;
  172. return OK;
  173. }
  174. case '"': {
  175. index++;
  176. String str;
  177. while (true) {
  178. if (p_str[index] == 0) {
  179. r_err_str = "Unterminated String";
  180. return ERR_PARSE_ERROR;
  181. } else if (p_str[index] == '"') {
  182. index++;
  183. break;
  184. } else if (p_str[index] == '\\') {
  185. //escaped characters...
  186. index++;
  187. char32_t next = p_str[index];
  188. if (next == 0) {
  189. r_err_str = "Unterminated String";
  190. return ERR_PARSE_ERROR;
  191. }
  192. char32_t res = 0;
  193. switch (next) {
  194. case 'b':
  195. res = 8;
  196. break;
  197. case 't':
  198. res = 9;
  199. break;
  200. case 'n':
  201. res = 10;
  202. break;
  203. case 'f':
  204. res = 12;
  205. break;
  206. case 'r':
  207. res = 13;
  208. break;
  209. case 'u': {
  210. // hex number
  211. for (int j = 0; j < 4; j++) {
  212. char32_t c = p_str[index + j + 1];
  213. if (c == 0) {
  214. r_err_str = "Unterminated String";
  215. return ERR_PARSE_ERROR;
  216. }
  217. if (!((c >= '0' && c <= '9') || (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F'))) {
  218. r_err_str = "Malformed hex constant in string";
  219. return ERR_PARSE_ERROR;
  220. }
  221. char32_t v;
  222. if (c >= '0' && c <= '9') {
  223. v = c - '0';
  224. } else if (c >= 'a' && c <= 'f') {
  225. v = c - 'a';
  226. v += 10;
  227. } else if (c >= 'A' && c <= 'F') {
  228. v = c - 'A';
  229. v += 10;
  230. } else {
  231. ERR_PRINT("Bug parsing hex constant.");
  232. v = 0;
  233. }
  234. res <<= 4;
  235. res |= v;
  236. }
  237. index += 4; //will add at the end anyway
  238. if ((res & 0xfffffc00) == 0xd800) {
  239. if (p_str[index + 1] != '\\' || p_str[index + 2] != 'u') {
  240. r_err_str = "Invalid UTF-16 sequence in string, unpaired lead surrogate";
  241. return ERR_PARSE_ERROR;
  242. }
  243. index += 2;
  244. char32_t trail = 0;
  245. for (int j = 0; j < 4; j++) {
  246. char32_t c = p_str[index + j + 1];
  247. if (c == 0) {
  248. r_err_str = "Unterminated String";
  249. return ERR_PARSE_ERROR;
  250. }
  251. if (!((c >= '0' && c <= '9') || (c >= 'a' && c <= 'f') || (c >= 'A' && c <= 'F'))) {
  252. r_err_str = "Malformed hex constant in string";
  253. return ERR_PARSE_ERROR;
  254. }
  255. char32_t v;
  256. if (c >= '0' && c <= '9') {
  257. v = c - '0';
  258. } else if (c >= 'a' && c <= 'f') {
  259. v = c - 'a';
  260. v += 10;
  261. } else if (c >= 'A' && c <= 'F') {
  262. v = c - 'A';
  263. v += 10;
  264. } else {
  265. ERR_PRINT("Bug parsing hex constant.");
  266. v = 0;
  267. }
  268. trail <<= 4;
  269. trail |= v;
  270. }
  271. if ((trail & 0xfffffc00) == 0xdc00) {
  272. res = (res << 10UL) + trail - ((0xd800 << 10UL) + 0xdc00 - 0x10000);
  273. index += 4; //will add at the end anyway
  274. } else {
  275. r_err_str = "Invalid UTF-16 sequence in string, unpaired lead surrogate";
  276. return ERR_PARSE_ERROR;
  277. }
  278. } else if ((res & 0xfffffc00) == 0xdc00) {
  279. r_err_str = "Invalid UTF-16 sequence in string, unpaired trail surrogate";
  280. return ERR_PARSE_ERROR;
  281. }
  282. } break;
  283. default: {
  284. res = next;
  285. } break;
  286. }
  287. str += res;
  288. } else {
  289. if (p_str[index] == '\n') {
  290. line++;
  291. }
  292. str += p_str[index];
  293. }
  294. index++;
  295. }
  296. r_token.type = TK_STRING;
  297. r_token.value = str;
  298. return OK;
  299. } break;
  300. default: {
  301. if (p_str[index] <= 32) {
  302. index++;
  303. break;
  304. }
  305. if (p_str[index] == '-' || (p_str[index] >= '0' && p_str[index] <= '9')) {
  306. //a number
  307. const char32_t *rptr;
  308. double number = String::to_float(&p_str[index], &rptr);
  309. index += (rptr - &p_str[index]);
  310. r_token.type = TK_NUMBER;
  311. r_token.value = number;
  312. return OK;
  313. } else if ((p_str[index] >= 'A' && p_str[index] <= 'Z') || (p_str[index] >= 'a' && p_str[index] <= 'z')) {
  314. String id;
  315. while ((p_str[index] >= 'A' && p_str[index] <= 'Z') || (p_str[index] >= 'a' && p_str[index] <= 'z')) {
  316. id += p_str[index];
  317. index++;
  318. }
  319. r_token.type = TK_IDENTIFIER;
  320. r_token.value = id;
  321. return OK;
  322. } else {
  323. r_err_str = "Unexpected character.";
  324. return ERR_PARSE_ERROR;
  325. }
  326. }
  327. }
  328. }
  329. return ERR_PARSE_ERROR;
  330. }
  331. Error JSON::_parse_value(Variant &value, Token &token, const char32_t *p_str, int &index, int p_len, int &line, String &r_err_str) {
  332. if (token.type == TK_CURLY_BRACKET_OPEN) {
  333. Dictionary d;
  334. Error err = _parse_object(d, p_str, index, p_len, line, r_err_str);
  335. if (err) {
  336. return err;
  337. }
  338. value = d;
  339. } else if (token.type == TK_BRACKET_OPEN) {
  340. Array a;
  341. Error err = _parse_array(a, p_str, index, p_len, line, r_err_str);
  342. if (err) {
  343. return err;
  344. }
  345. value = a;
  346. } else if (token.type == TK_IDENTIFIER) {
  347. String id = token.value;
  348. if (id == "true") {
  349. value = true;
  350. } else if (id == "false") {
  351. value = false;
  352. } else if (id == "null") {
  353. value = Variant();
  354. } else {
  355. r_err_str = "Expected 'true','false' or 'null', got '" + id + "'.";
  356. return ERR_PARSE_ERROR;
  357. }
  358. } else if (token.type == TK_NUMBER) {
  359. value = token.value;
  360. } else if (token.type == TK_STRING) {
  361. value = token.value;
  362. } else {
  363. r_err_str = "Expected value, got " + String(tk_name[token.type]) + ".";
  364. return ERR_PARSE_ERROR;
  365. }
  366. return OK;
  367. }
  368. Error JSON::_parse_array(Array &array, const char32_t *p_str, int &index, int p_len, int &line, String &r_err_str) {
  369. Token token;
  370. bool need_comma = false;
  371. while (index < p_len) {
  372. Error err = _get_token(p_str, index, p_len, token, line, r_err_str);
  373. if (err != OK) {
  374. return err;
  375. }
  376. if (token.type == TK_BRACKET_CLOSE) {
  377. return OK;
  378. }
  379. if (need_comma) {
  380. if (token.type != TK_COMMA) {
  381. r_err_str = "Expected ','";
  382. return ERR_PARSE_ERROR;
  383. } else {
  384. need_comma = false;
  385. continue;
  386. }
  387. }
  388. Variant v;
  389. err = _parse_value(v, token, p_str, index, p_len, line, r_err_str);
  390. if (err) {
  391. return err;
  392. }
  393. array.push_back(v);
  394. need_comma = true;
  395. }
  396. r_err_str = "Expected ']'";
  397. return ERR_PARSE_ERROR;
  398. }
  399. Error JSON::_parse_object(Dictionary &object, const char32_t *p_str, int &index, int p_len, int &line, String &r_err_str) {
  400. bool at_key = true;
  401. String key;
  402. Token token;
  403. bool need_comma = false;
  404. while (index < p_len) {
  405. if (at_key) {
  406. Error err = _get_token(p_str, index, p_len, token, line, r_err_str);
  407. if (err != OK) {
  408. return err;
  409. }
  410. if (token.type == TK_CURLY_BRACKET_CLOSE) {
  411. return OK;
  412. }
  413. if (need_comma) {
  414. if (token.type != TK_COMMA) {
  415. r_err_str = "Expected '}' or ','";
  416. return ERR_PARSE_ERROR;
  417. } else {
  418. need_comma = false;
  419. continue;
  420. }
  421. }
  422. if (token.type != TK_STRING) {
  423. r_err_str = "Expected key";
  424. return ERR_PARSE_ERROR;
  425. }
  426. key = token.value;
  427. err = _get_token(p_str, index, p_len, token, line, r_err_str);
  428. if (err != OK) {
  429. return err;
  430. }
  431. if (token.type != TK_COLON) {
  432. r_err_str = "Expected ':'";
  433. return ERR_PARSE_ERROR;
  434. }
  435. at_key = false;
  436. } else {
  437. Error err = _get_token(p_str, index, p_len, token, line, r_err_str);
  438. if (err != OK) {
  439. return err;
  440. }
  441. Variant v;
  442. err = _parse_value(v, token, p_str, index, p_len, line, r_err_str);
  443. if (err) {
  444. return err;
  445. }
  446. object[key] = v;
  447. need_comma = true;
  448. at_key = true;
  449. }
  450. }
  451. r_err_str = "Expected '}'";
  452. return ERR_PARSE_ERROR;
  453. }
  454. Error JSON::parse(const String &p_json, Variant &r_ret, String &r_err_str, int &r_err_line) {
  455. const char32_t *str = p_json.ptr();
  456. int idx = 0;
  457. int len = p_json.length();
  458. Token token;
  459. r_err_line = 0;
  460. String aux_key;
  461. Error err = _get_token(str, idx, len, token, r_err_line, r_err_str);
  462. if (err) {
  463. return err;
  464. }
  465. err = _parse_value(r_ret, token, str, idx, len, r_err_line, r_err_str);
  466. // Check if EOF is reached
  467. // or it's a type of the next token.
  468. if (err == OK && idx < len) {
  469. err = _get_token(str, idx, len, token, r_err_line, r_err_str);
  470. if (err || token.type != TK_EOF) {
  471. r_err_str = "Expected 'EOF'";
  472. // Reset return value to empty `Variant`
  473. r_ret = Variant();
  474. return ERR_PARSE_ERROR;
  475. }
  476. }
  477. return err;
  478. }
  479. Error JSONParser::parse_string(const String &p_json_string) {
  480. return JSON::parse(p_json_string, data, err_text, err_line);
  481. }
  482. String JSONParser::get_error_text() const {
  483. return err_text;
  484. }
  485. int JSONParser::get_error_line() const {
  486. return err_line;
  487. }
  488. Variant JSONParser::get_data() const {
  489. return data;
  490. }
  491. Error JSONParser::decode_data(const Variant &p_data, const String &p_indent, bool p_sort_keys) {
  492. string = JSON::print(p_data, p_indent, p_sort_keys);
  493. data = p_data;
  494. return OK;
  495. }
  496. String JSONParser::get_string() const {
  497. return string;
  498. }
  499. void JSONParser::_bind_methods() {
  500. ClassDB::bind_method(D_METHOD("parse_string", "json_string"), &JSONParser::parse_string);
  501. ClassDB::bind_method(D_METHOD("get_error_text"), &JSONParser::get_error_text);
  502. ClassDB::bind_method(D_METHOD("get_error_line"), &JSONParser::get_error_line);
  503. ClassDB::bind_method(D_METHOD("get_data"), &JSONParser::get_data);
  504. ClassDB::bind_method(D_METHOD("decode_data", "data", "indent", "sort_keys"), &JSONParser::decode_data, DEFVAL(""), DEFVAL(true));
  505. ClassDB::bind_method(D_METHOD("get_string"), &JSONParser::get_string);
  506. }