// StringTest.cpp
#include "../testTools.h"
// TODO: Casting to the parent type cannot be used at the same time as automatic conversion from const char*.
//       Cover everything using a single dsr::String type?
//       Use "" operand as the only constructor?
  5. void fooInPlace(dsr::String& target, const dsr::ReadableString& a, const dsr::ReadableString& b) {
  6. string_clear(target);
  7. target.append(U"Foo(");
  8. target.append(a);
  9. target.appendChar(U',');
  10. target.append(b);
  11. target.appendChar(U')');
  12. }
  13. dsr::String foo(const dsr::ReadableString& a, const dsr::ReadableString& b) {
  14. dsr::String result;
  15. result.reserve(string_length(a) + string_length(b) + 6);
  16. fooInPlace(result, a, b);
  17. return result;
  18. }
  19. START_TEST(String)
  20. { // Length
  21. ASSERT_EQUAL(string_length(dsr::String()), 0);
  22. ASSERT_EQUAL(string_length(U""), 0);
  23. ASSERT_EQUAL(string_length(U"a"), 1);
  24. ASSERT_EQUAL(string_length(U"ab"), 2);
  25. ASSERT_EQUAL(string_length(U"abc"), 3);
  26. ASSERT_EQUAL(string_length(U"0123456789"), 10);
  27. }
  28. { // Reading characters
  29. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[0], U'A');
  30. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[1], U'B');
  31. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[2], U'C');
  32. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[3], U'\0');
  33. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[10], U'\0');
  34. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[1000000], U'\0');
  35. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[-1], U'\0');
  36. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[-1000000], U'\0');
  37. ASSERT_EQUAL(dsr::ReadableString(U"")[-1], U'\0');
  38. ASSERT_EQUAL(dsr::ReadableString(U"")[0], U'\0');
  39. ASSERT_EQUAL(dsr::ReadableString(U"")[1], U'\0');
  40. }
  41. { // Comparison
  42. dsr::ReadableString litA = U"Testing \u0444";
  43. dsr::ReadableString litB = U"Testing ф";
  44. ASSERT(string_match(litA, litB));
  45. ASSERT(!string_match(litA, U"wrong"));
  46. ASSERT(!string_match(U"wrong", litB));
  47. ASSERT(dsr::string_caseInsensitiveMatch(U"abc 123!", U"ABC 123!"));
  48. ASSERT(!dsr::string_caseInsensitiveMatch(U"abc 123!", U"ABD 123!"));
  49. ASSERT(dsr::string_match(U"aBc 123!", U"aBc 123!"));
  50. ASSERT(!dsr::string_match(U"abc 123!", U"ABC 123!"));
  51. }
  52. { // Concatenation
  53. dsr::String ab = dsr::string_combine(U"a", U"b");
  54. ASSERT_MATCH(ab, U"ab");
  55. dsr::String cd = dsr::string_combine(U"c", U"d");
  56. ASSERT_MATCH(cd, U"cd");
  57. cd = dsr::string_combine(U"c", U"d");
  58. ASSERT_MATCH(cd, U"cd");
  59. auto abcd = ab + cd;
  60. ASSERT_MATCH(abcd, U"abcd");
  61. ASSERT_MATCH(dsr::string_combine(U"a", U"b", U"c", "d"), U"abcd");
  62. }
  63. { // Sub-strings
  64. dsr::ReadableString abcd = U"abcd";
  65. dsr::String efgh = U"efgh";
  66. ASSERT_MATCH(dsr::string_inclusiveRange(abcd, 0, 3), U"abcd");
  67. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 1, 2), U"b");
  68. ASSERT_MATCH(dsr::string_inclusiveRange(efgh, 2, 3), U"gh");
  69. ASSERT_MATCH(dsr::string_exclusiveRange(efgh, 3, 4), U"h");
  70. ASSERT_MATCH(dsr::string_combine(string_from(abcd, 2), string_before(efgh, 2)), U"cdef");
  71. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 0, 0), U""); // No size returns nothing
  72. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, -670214452, 2), U"ab"); // Reading out of bound is clamped
  73. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 2, 985034841), U"cd"); // Reading out of bound is clamped
  74. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 4, 764), U""); // Completely ous of bound returns nothing
  75. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, -631, 0), U""); // Completely ous of bound returns nothing
  76. }
  77. { // Processing
  78. dsr::String buffer = U"Garbage";
  79. ASSERT_MATCH(buffer, U"Garbage");
  80. buffer = foo(U"Ball", U"åäöÅÄÖ"); // Crash!
  81. ASSERT_MATCH(buffer, U"Foo(Ball,åäöÅÄÖ)"); // Failed
  82. fooInPlace(buffer, U"Å", U"ф");
  83. ASSERT_MATCH(buffer, U"Foo(Å,ф)");
  84. }
  85. { // Numbers
  86. uint32_t x = 0;
  87. int32_t y = -123456;
  88. int64_t z = 100200300400500600ULL;
  89. dsr::String values = dsr::string_combine(U"x = ", x, U", y = ", y, U", z = ", z);
  90. ASSERT_MATCH(values, U"x = 0, y = -123456, z = 100200300400500600");
  91. }
  92. { // Identifying numbers
  93. ASSERT_EQUAL(dsr::character_isDigit(U'0' - 1), false);
  94. ASSERT_EQUAL(dsr::character_isDigit(U'0'), true);
  95. ASSERT_EQUAL(dsr::character_isDigit(U'1'), true);
  96. ASSERT_EQUAL(dsr::character_isDigit(U'2'), true);
  97. ASSERT_EQUAL(dsr::character_isDigit(U'3'), true);
  98. ASSERT_EQUAL(dsr::character_isDigit(U'4'), true);
  99. ASSERT_EQUAL(dsr::character_isDigit(U'5'), true);
  100. ASSERT_EQUAL(dsr::character_isDigit(U'6'), true);
  101. ASSERT_EQUAL(dsr::character_isDigit(U'7'), true);
  102. ASSERT_EQUAL(dsr::character_isDigit(U'8'), true);
  103. ASSERT_EQUAL(dsr::character_isDigit(U'9'), true);
  104. ASSERT_EQUAL(dsr::character_isDigit(U'9' + 1), false);
  105. ASSERT_EQUAL(dsr::character_isDigit(U'a'), false);
  106. ASSERT_EQUAL(dsr::character_isDigit(U' '), false);
  107. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'-'), true);
  108. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'0' - 1), false);
  109. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'0'), true);
  110. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'9'), true);
  111. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'9' + 1), false);
  112. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'a'), false);
  113. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U' '), false);
  114. ASSERT_EQUAL(dsr::character_isValueCharacter(U'-'), true);
  115. ASSERT_EQUAL(dsr::character_isValueCharacter(U'.'), true);
  116. ASSERT_EQUAL(dsr::character_isValueCharacter(U'0' - 1), false);
  117. ASSERT_EQUAL(dsr::character_isValueCharacter(U'0'), true);
  118. ASSERT_EQUAL(dsr::character_isValueCharacter(U'9'), true);
  119. ASSERT_EQUAL(dsr::character_isValueCharacter(U'9' + 1), false);
  120. ASSERT_EQUAL(dsr::character_isValueCharacter(U'a'), false);
  121. ASSERT_EQUAL(dsr::character_isValueCharacter(U' '), false);
  122. ASSERT_EQUAL(dsr::character_isWhiteSpace(U' '), true);
  123. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\t'), true);
  124. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\r'), true);
  125. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\0'), false);
  126. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'a'), false);
  127. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'1'), false);
  128. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'('), false);
  129. ASSERT_EQUAL(dsr::character_isWhiteSpace(U')'), false);
  130. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'.'), false);
  131. ASSERT_EQUAL(dsr::character_isWhiteSpace(U','), false);
  132. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'-'), false);
  133. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'_'), false);
  134. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'|'), false);
  135. ASSERT_EQUAL(dsr::string_isInteger(U"0"), true);
  136. ASSERT_EQUAL(dsr::string_isInteger(U"1"), true);
  137. ASSERT_EQUAL(dsr::string_isInteger(U"-0"), true);
  138. ASSERT_EQUAL(dsr::string_isInteger(U"-1"), true);
  139. ASSERT_EQUAL(dsr::string_isInteger(U"0", false), true);
  140. ASSERT_EQUAL(dsr::string_isInteger(U" 0 "), true);
  141. ASSERT_EQUAL(dsr::string_isInteger(U" 0 ", false), false);
  142. ASSERT_EQUAL(dsr::string_isInteger(U" 123"), true);
  143. ASSERT_EQUAL(dsr::string_isInteger(U"-123"), true);
  144. ASSERT_EQUAL(dsr::string_isInteger(U""), false);
  145. ASSERT_EQUAL(dsr::string_isDouble(U"0"), true);
  146. ASSERT_EQUAL(dsr::string_isDouble(U"-0"), true);
  147. ASSERT_EQUAL(dsr::string_isDouble(U"1"), true);
  148. ASSERT_EQUAL(dsr::string_isDouble(U"-1"), true);
  149. ASSERT_EQUAL(dsr::string_isDouble(U"1.1"), true);
  150. ASSERT_EQUAL(dsr::string_isDouble(U"-1.1"), true);
  151. ASSERT_EQUAL(dsr::string_isDouble(U".1"), true);
  152. ASSERT_EQUAL(dsr::string_isDouble(U"-.1"), true);
  153. ASSERT_EQUAL(dsr::string_isDouble(U"0", false), true);
  154. ASSERT_EQUAL(dsr::string_isDouble(U" 0 "), true);
  155. ASSERT_EQUAL(dsr::string_isDouble(U" 0 ", false), false);
  156. ASSERT_EQUAL(dsr::string_isDouble(U" 123"), true);
  157. ASSERT_EQUAL(dsr::string_isDouble(U"-123"), true);
  158. ASSERT_EQUAL(dsr::string_isDouble(U"0.5"), true);
  159. ASSERT_EQUAL(dsr::string_isDouble(U"-0.5"), true);
  160. ASSERT_EQUAL(dsr::string_isDouble(U".5"), true);
  161. ASSERT_EQUAL(dsr::string_isDouble(U"-.5"), true);
  162. ASSERT_EQUAL(dsr::string_isDouble(U"0.54321"), true);
  163. ASSERT_EQUAL(dsr::string_isDouble(U"-0.54321"), true);
  164. ASSERT_EQUAL(dsr::string_isDouble(U""), false);
  165. }
  166. // Upper case
  167. ASSERT_MATCH(dsr::string_upperCase(U"a"), U"A");
  168. ASSERT_MATCH(dsr::string_upperCase(U"aB"), U"AB");
  169. ASSERT_MATCH(dsr::string_upperCase(U"abc"), U"ABC");
  170. ASSERT_MATCH(dsr::string_upperCase(U"abc1"), U"ABC1");
  171. ASSERT_MATCH(dsr::string_upperCase(U"Abc12"), U"ABC12");
  172. ASSERT_MATCH(dsr::string_upperCase(U"ABC123"), U"ABC123");
  173. // Lower case
  174. ASSERT_MATCH(dsr::string_lowerCase(U"a"), U"a");
  175. ASSERT_MATCH(dsr::string_lowerCase(U"aB"), U"ab");
  176. ASSERT_MATCH(dsr::string_lowerCase(U"abc"), U"abc");
  177. ASSERT_MATCH(dsr::string_lowerCase(U"abc1"), U"abc1");
  178. ASSERT_MATCH(dsr::string_lowerCase(U"Abc12"), U"abc12");
  179. ASSERT_MATCH(dsr::string_lowerCase(U"ABC123"), U"abc123");
  180. // White space removal by pointing to a section of the original input
  181. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" "), U"");
  182. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" abc "), U"abc");
  183. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" two words "), U"two words");
  184. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" \" something quoted \" "), U"\" something quoted \"");
  185. // Quote mangling
  186. ASSERT_MATCH(dsr::string_mangleQuote(U""), U"\"\"");
  187. ASSERT_MATCH(dsr::string_mangleQuote(U"1"), U"\"1\"");
  188. ASSERT_MATCH(dsr::string_mangleQuote(U"12"), U"\"12\"");
  189. ASSERT_MATCH(dsr::string_mangleQuote(U"123"), U"\"123\"");
  190. ASSERT_MATCH(dsr::string_mangleQuote(U"abc"), U"\"abc\"");
  191. // Not enough quote signs
  192. ASSERT_CRASH(dsr::string_unmangleQuote(U""));
  193. ASSERT_CRASH(dsr::string_unmangleQuote(U" "));
  194. ASSERT_CRASH(dsr::string_unmangleQuote(U"ab\"cd"));
  195. // Too many quote signs
  196. ASSERT_CRASH(dsr::string_unmangleQuote(U"ab\"cd\"ef\"gh"));
  197. // Basic quote
  198. ASSERT_MATCH(dsr::string_unmangleQuote(U"\"ab\""), U"ab");
  199. // Surrounded quote
  200. ASSERT_MATCH(dsr::string_unmangleQuote(U"\"ab\"cd"), U"ab");
  201. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"cd\""), U"cd");
  202. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"cd\"ef"), U"cd");
  203. // Mangled quote inside of quote
  204. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"c\\\"d\"ef"), U"c\"d");
  205. ASSERT_MATCH(dsr::string_unmangleQuote(dsr::string_mangleQuote(U"c\"d")), U"c\"d");
  206. // Mangle things
  207. dsr::String randomText;
  208. string_reserve(randomText, 100);
  209. for (int i = 1; i < 100; i++) {
  210. // Randomize previous characters
  211. for (int j = 1; j < i - 1; j++) {
  212. string_appendChar(randomText, (DsrChar)((i * 21 + j * 49 + 136) % 1024));
  213. }
  214. // Add a new random character
  215. string_appendChar(randomText, (i * 21 + 136) % 256);
  216. ASSERT_MATCH(dsr::string_unmangleQuote(dsr::string_mangleQuote(randomText)), randomText);
  217. }
  218. // Number serialization
  219. ASSERT_MATCH(dsr::string_combine(0, U" ", 1), U"0 1");
  220. ASSERT_MATCH(dsr::string_combine(14, U"x", 135), U"14x135");
  221. ASSERT_MATCH(dsr::string_combine(-135), U"-135");
  222. ASSERT_MATCH(dsr::string_combine(-14), U"-14");
  223. ASSERT_MATCH(dsr::string_combine(-1), U"-1");
  224. ASSERT_MATCH(dsr::string_combine(0u), U"0");
  225. ASSERT_MATCH(dsr::string_combine(1u), U"1");
  226. ASSERT_MATCH(dsr::string_combine(14u), U"14");
  227. ASSERT_MATCH(dsr::string_combine(135u), U"135");
  228. // Number parsing
  229. ASSERT_EQUAL(string_toInteger(U"0"), 0);
  230. ASSERT_EQUAL(string_toInteger(U"-0"), 0);
  231. ASSERT_EQUAL(string_toInteger(U"No digits here."), 0);
  232. ASSERT_EQUAL(string_toInteger(U" (12 garbage 34) "), 1234); // You are supposed to catch these errors before converting to an integer
  233. ASSERT_EQUAL(string_toInteger(U""), 0);
  234. ASSERT_EQUAL(string_toInteger(U"1"), 1);
  235. ASSERT_EQUAL(string_toInteger(U"-1"), -1);
  236. ASSERT_EQUAL(string_toInteger(U"1024"), 1024);
  237. ASSERT_EQUAL(string_toInteger(U"-1024"), -1024);
  238. ASSERT_EQUAL(string_toInteger(U"1000000"), 1000000);
  239. ASSERT_EQUAL(string_toInteger(U"-1000000"), -1000000);
  240. ASSERT_EQUAL(string_toInteger(U"123"), 123);
  241. ASSERT_EQUAL(string_toDouble(U"123"), 123.0);
  242. ASSERT_EQUAL(string_toDouble(U"123.456"), 123.456);
  243. { // Assigning strings using reference counting
  244. String a = U"Some text";
  245. ASSERT_EQUAL(string_getBufferUseCount(a), 1);
  246. String b = a;
  247. ASSERT_EQUAL(string_getBufferUseCount(a), 2);
  248. ASSERT_EQUAL(string_getBufferUseCount(b), 2);
  249. String c = b;
  250. ASSERT_EQUAL(string_getBufferUseCount(a), 3);
  251. ASSERT_EQUAL(string_getBufferUseCount(b), 3);
  252. ASSERT_EQUAL(string_getBufferUseCount(c), 3);
  253. }
  254. { // String splitting by shared reference counted buffer
  255. String source = U"a . b . c . d";
  256. List<String> result;
  257. result = string_split(source, U'.', false);
  258. ASSERT_EQUAL(string_getBufferUseCount(source), 1);
  259. ASSERT_EQUAL(result.length(), 4);
  260. ASSERT_MATCH(result[0], U"a ");
  261. ASSERT_MATCH(result[1], U" b ");
  262. ASSERT_MATCH(result[2], U" c ");
  263. ASSERT_MATCH(result[3], U" d");
  264. //ASSERT_EQUAL(string_getBufferUseCount(source), 5);
  265. result = string_split(U"a . b .\tc", U'.', true);
  266. ASSERT_EQUAL(result.length(), 3);
  267. ASSERT_MATCH(result[0], U"a");
  268. ASSERT_MATCH(result[1], U"b");
  269. ASSERT_MATCH(result[2], U"c");
  270. //ASSERT_EQUAL(string_getBufferUseCount(source), 4);
  271. }
  272. { // Callback splitting
  273. String numbers = U"1, 3, 5, 7, 9";
  274. List<int> result;
  275. string_split_callback([&numbers, &result](ReadableString section) {
  276. result.push(string_toInteger(section));
  277. }, numbers, U',');
  278. ASSERT_EQUAL(result.length(), 5);
  279. ASSERT_EQUAL(result[0], 1);
  280. ASSERT_EQUAL(result[1], 3);
  281. ASSERT_EQUAL(result[2], 5);
  282. ASSERT_EQUAL(result[3], 7);
  283. ASSERT_EQUAL(result[4], 9);
  284. }
  285. // TODO: Test taking a part of a parent string with a start offset, leaving the parent scope,
  286. // and expanding with append while the buffer isn't shared but has an offset from buffer start.
  287. // TODO: Test sharing the same buffer between strings, then clear and append more text without overwriting other strings.
  288. // TODO: Assert that buffers are shared when they should, but prevents side-effects when one is being written to.
  289. END_TEST