// StringTest.cpp (13 KB)
  1. #include "../testTools.h"
  2. // TODO: Cannot use casting to parent type at the same time as automatic conversion from const char*
  3. // Cover everything using a single dsr::String type?
  4. // Use "" operand as only constructor?
  5. void fooInPlace(dsr::String& target, const dsr::ReadableString& a, const dsr::ReadableString& b) {
  6. target.clear();
  7. target.append(U"Foo(");
  8. target.append(a);
  9. target.appendChar(U',');
  10. target.append(b);
  11. target.appendChar(U')');
  12. }
  13. dsr::String foo(const dsr::ReadableString& a, const dsr::ReadableString& b) {
  14. dsr::String result;
  15. result.reserve(string_length(a) + string_length(b) + 6);
  16. fooInPlace(result, a, b);
  17. return result;
  18. }
  19. START_TEST(String)
  20. { // Length
  21. ASSERT_EQUAL(string_length(dsr::String()), 0);
  22. ASSERT_EQUAL(string_length(U""), 0);
  23. ASSERT_EQUAL(string_length(U"a"), 1);
  24. ASSERT_EQUAL(string_length(U"ab"), 2);
  25. ASSERT_EQUAL(string_length(U"abc"), 3);
  26. ASSERT_EQUAL(string_length(U"0123456789"), 10);
  27. }
  28. { // Reading characters
  29. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[0], U'A');
  30. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[1], U'B');
  31. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[2], U'C');
  32. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[3], U'\0');
  33. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[10], U'\0');
  34. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[1000000], U'\0');
  35. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[-1], U'\0');
  36. ASSERT_EQUAL(dsr::ReadableString(U"ABC")[-1000000], U'\0');
  37. ASSERT_EQUAL(dsr::ReadableString(U"")[-1], U'\0');
  38. ASSERT_EQUAL(dsr::ReadableString(U"")[0], U'\0');
  39. ASSERT_EQUAL(dsr::ReadableString(U"")[1], U'\0');
  40. }
  41. { // Comparison
  42. dsr::ReadableString litA = U"Testing \u0444";
  43. dsr::ReadableString litB = U"Testing ф";
  44. ASSERT(string_match(litA, litB));
  45. ASSERT(!string_match(litA, U"wrong"));
  46. ASSERT(!string_match(U"wrong", litB));
  47. ASSERT(dsr::string_caseInsensitiveMatch(U"abc 123!", U"ABC 123!"));
  48. ASSERT(!dsr::string_caseInsensitiveMatch(U"abc 123!", U"ABD 123!"));
  49. ASSERT(dsr::string_match(U"aBc 123!", U"aBc 123!"));
  50. ASSERT(!dsr::string_match(U"abc 123!", U"ABC 123!"));
  51. }
  52. { // Concatenation
  53. dsr::String ab = dsr::string_combine(U"a", U"b");
  54. ASSERT_MATCH(ab, U"ab");
  55. dsr::String cd = dsr::string_combine(U"c", U"d");
  56. ASSERT_MATCH(cd, U"cd");
  57. cd = dsr::string_combine(U"c", U"d");
  58. ASSERT_MATCH(cd, U"cd");
  59. auto abcd = ab + cd;
  60. ASSERT_MATCH(abcd, U"abcd");
  61. ASSERT_MATCH(dsr::string_combine(U"a", U"b", U"c", "d"), U"abcd");
  62. }
  63. { // Sub-strings
  64. dsr::ReadableString abcd = U"abcd";
  65. dsr::String efgh = U"efgh";
  66. ASSERT_MATCH(dsr::string_inclusiveRange(abcd, 0, 3), U"abcd");
  67. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 1, 2), U"b");
  68. ASSERT_MATCH(dsr::string_inclusiveRange(efgh, 2, 3), U"gh");
  69. ASSERT_MATCH(dsr::string_exclusiveRange(efgh, 3, 4), U"h");
  70. ASSERT_MATCH(dsr::string_combine(string_from(abcd, 2), string_before(efgh, 2)), U"cdef");
  71. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, 0, 0), U""); // No size returns nothing
  72. ASSERT_MATCH(dsr::string_exclusiveRange(abcd, -1, -2), U""); // A negative size doesn't have to be inside
  73. ASSERT_CRASH(dsr::string_inclusiveRange(abcd, -1, -1)); // Index below bound expected
  74. ASSERT_CRASH(dsr::string_inclusiveRange(abcd, 4, 4)); // Index above bound expected
  75. }
  76. { // Processing
  77. dsr::String buffer = U"Garbage";
  78. ASSERT_MATCH(buffer, U"Garbage");
  79. buffer = foo(U"Ball", U"åäöÅÄÖ"); // Crash!
  80. ASSERT_MATCH(buffer, U"Foo(Ball,åäöÅÄÖ)"); // Failed
  81. fooInPlace(buffer, U"Å", U"ф");
  82. ASSERT_MATCH(buffer, U"Foo(Å,ф)");
  83. }
  84. { // Numbers
  85. uint32_t x = 0;
  86. int32_t y = -123456;
  87. int64_t z = 100200300400500600ULL;
  88. dsr::String values = dsr::string_combine(U"x = ", x, U", y = ", y, U", z = ", z);
  89. ASSERT_MATCH(values, U"x = 0, y = -123456, z = 100200300400500600");
  90. }
  91. { // Identifying numbers
  92. ASSERT_EQUAL(dsr::character_isDigit(U'0' - 1), false);
  93. ASSERT_EQUAL(dsr::character_isDigit(U'0'), true);
  94. ASSERT_EQUAL(dsr::character_isDigit(U'1'), true);
  95. ASSERT_EQUAL(dsr::character_isDigit(U'2'), true);
  96. ASSERT_EQUAL(dsr::character_isDigit(U'3'), true);
  97. ASSERT_EQUAL(dsr::character_isDigit(U'4'), true);
  98. ASSERT_EQUAL(dsr::character_isDigit(U'5'), true);
  99. ASSERT_EQUAL(dsr::character_isDigit(U'6'), true);
  100. ASSERT_EQUAL(dsr::character_isDigit(U'7'), true);
  101. ASSERT_EQUAL(dsr::character_isDigit(U'8'), true);
  102. ASSERT_EQUAL(dsr::character_isDigit(U'9'), true);
  103. ASSERT_EQUAL(dsr::character_isDigit(U'9' + 1), false);
  104. ASSERT_EQUAL(dsr::character_isDigit(U'a'), false);
  105. ASSERT_EQUAL(dsr::character_isDigit(U' '), false);
  106. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'-'), true);
  107. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'0' - 1), false);
  108. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'0'), true);
  109. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'9'), true);
  110. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'9' + 1), false);
  111. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U'a'), false);
  112. ASSERT_EQUAL(dsr::character_isIntegerCharacter(U' '), false);
  113. ASSERT_EQUAL(dsr::character_isValueCharacter(U'-'), true);
  114. ASSERT_EQUAL(dsr::character_isValueCharacter(U'.'), true);
  115. ASSERT_EQUAL(dsr::character_isValueCharacter(U'0' - 1), false);
  116. ASSERT_EQUAL(dsr::character_isValueCharacter(U'0'), true);
  117. ASSERT_EQUAL(dsr::character_isValueCharacter(U'9'), true);
  118. ASSERT_EQUAL(dsr::character_isValueCharacter(U'9' + 1), false);
  119. ASSERT_EQUAL(dsr::character_isValueCharacter(U'a'), false);
  120. ASSERT_EQUAL(dsr::character_isValueCharacter(U' '), false);
  121. ASSERT_EQUAL(dsr::character_isWhiteSpace(U' '), true);
  122. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\t'), true);
  123. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\r'), true);
  124. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'\0'), false);
  125. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'a'), false);
  126. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'1'), false);
  127. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'('), false);
  128. ASSERT_EQUAL(dsr::character_isWhiteSpace(U')'), false);
  129. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'.'), false);
  130. ASSERT_EQUAL(dsr::character_isWhiteSpace(U','), false);
  131. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'-'), false);
  132. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'_'), false);
  133. ASSERT_EQUAL(dsr::character_isWhiteSpace(U'|'), false);
  134. ASSERT_EQUAL(dsr::string_isInteger(U"0"), true);
  135. ASSERT_EQUAL(dsr::string_isInteger(U"1"), true);
  136. ASSERT_EQUAL(dsr::string_isInteger(U"-0"), true);
  137. ASSERT_EQUAL(dsr::string_isInteger(U"-1"), true);
  138. ASSERT_EQUAL(dsr::string_isInteger(U"0", false), true);
  139. ASSERT_EQUAL(dsr::string_isInteger(U" 0 "), true);
  140. ASSERT_EQUAL(dsr::string_isInteger(U" 0 ", false), false);
  141. ASSERT_EQUAL(dsr::string_isInteger(U" 123"), true);
  142. ASSERT_EQUAL(dsr::string_isInteger(U"-123"), true);
  143. ASSERT_EQUAL(dsr::string_isInteger(U""), false);
  144. ASSERT_EQUAL(dsr::string_isDouble(U"0"), true);
  145. ASSERT_EQUAL(dsr::string_isDouble(U"-0"), true);
  146. ASSERT_EQUAL(dsr::string_isDouble(U"1"), true);
  147. ASSERT_EQUAL(dsr::string_isDouble(U"-1"), true);
  148. ASSERT_EQUAL(dsr::string_isDouble(U"1.1"), true);
  149. ASSERT_EQUAL(dsr::string_isDouble(U"-1.1"), true);
  150. ASSERT_EQUAL(dsr::string_isDouble(U".1"), true);
  151. ASSERT_EQUAL(dsr::string_isDouble(U"-.1"), true);
  152. ASSERT_EQUAL(dsr::string_isDouble(U"0", false), true);
  153. ASSERT_EQUAL(dsr::string_isDouble(U" 0 "), true);
  154. ASSERT_EQUAL(dsr::string_isDouble(U" 0 ", false), false);
  155. ASSERT_EQUAL(dsr::string_isDouble(U" 123"), true);
  156. ASSERT_EQUAL(dsr::string_isDouble(U"-123"), true);
  157. ASSERT_EQUAL(dsr::string_isDouble(U"0.5"), true);
  158. ASSERT_EQUAL(dsr::string_isDouble(U"-0.5"), true);
  159. ASSERT_EQUAL(dsr::string_isDouble(U".5"), true);
  160. ASSERT_EQUAL(dsr::string_isDouble(U"-.5"), true);
  161. ASSERT_EQUAL(dsr::string_isDouble(U"0.54321"), true);
  162. ASSERT_EQUAL(dsr::string_isDouble(U"-0.54321"), true);
  163. ASSERT_EQUAL(dsr::string_isDouble(U""), false);
  164. }
  165. // Upper case
  166. ASSERT_MATCH(dsr::string_upperCase(U"a"), U"A");
  167. ASSERT_MATCH(dsr::string_upperCase(U"aB"), U"AB");
  168. ASSERT_MATCH(dsr::string_upperCase(U"abc"), U"ABC");
  169. ASSERT_MATCH(dsr::string_upperCase(U"abc1"), U"ABC1");
  170. ASSERT_MATCH(dsr::string_upperCase(U"Abc12"), U"ABC12");
  171. ASSERT_MATCH(dsr::string_upperCase(U"ABC123"), U"ABC123");
  172. // Lower case
  173. ASSERT_MATCH(dsr::string_lowerCase(U"a"), U"a");
  174. ASSERT_MATCH(dsr::string_lowerCase(U"aB"), U"ab");
  175. ASSERT_MATCH(dsr::string_lowerCase(U"abc"), U"abc");
  176. ASSERT_MATCH(dsr::string_lowerCase(U"abc1"), U"abc1");
  177. ASSERT_MATCH(dsr::string_lowerCase(U"Abc12"), U"abc12");
  178. ASSERT_MATCH(dsr::string_lowerCase(U"ABC123"), U"abc123");
  179. // Complete white space removal
  180. ASSERT_MATCH(dsr::string_removeAllWhiteSpace(U" "), U"");
  181. ASSERT_MATCH(dsr::string_removeAllWhiteSpace(U" abc\n "), U"abc");
  182. ASSERT_MATCH(dsr::string_removeAllWhiteSpace(U" a \f sentence \r surrounded \n by spa\vce \t"), U"asentencesurroundedbyspace");
  183. // White space removal by pointing to a section of the original input
  184. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" "), U"");
  185. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" abc "), U"abc");
  186. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" two words "), U"two words");
  187. ASSERT_MATCH(dsr::string_removeOuterWhiteSpace(U" \" something quoted \" "), U"\" something quoted \"");
  188. // Quote mangling
  189. ASSERT_MATCH(dsr::string_mangleQuote(U""), U"\"\"");
  190. ASSERT_MATCH(dsr::string_mangleQuote(U"1"), U"\"1\"");
  191. ASSERT_MATCH(dsr::string_mangleQuote(U"12"), U"\"12\"");
  192. ASSERT_MATCH(dsr::string_mangleQuote(U"123"), U"\"123\"");
  193. ASSERT_MATCH(dsr::string_mangleQuote(U"abc"), U"\"abc\"");
  194. // Not enough quote signs
  195. ASSERT_CRASH(dsr::string_unmangleQuote(U""));
  196. ASSERT_CRASH(dsr::string_unmangleQuote(U" "));
  197. ASSERT_CRASH(dsr::string_unmangleQuote(U"ab\"cd"));
  198. // Too many quote signs
  199. ASSERT_CRASH(dsr::string_unmangleQuote(U"ab\"cd\"ef\"gh"));
  200. // Basic quote
  201. ASSERT_MATCH(dsr::string_unmangleQuote(U"\"ab\""), U"ab");
  202. // Surrounded quote
  203. ASSERT_MATCH(dsr::string_unmangleQuote(U"\"ab\"cd"), U"ab");
  204. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"cd\""), U"cd");
  205. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"cd\"ef"), U"cd");
  206. // Mangled quote inside of quote
  207. ASSERT_MATCH(dsr::string_unmangleQuote(U"ab\"c\\\"d\"ef"), U"c\"d");
  208. ASSERT_MATCH(dsr::string_unmangleQuote(dsr::string_mangleQuote(U"c\"d")), U"c\"d");
  209. // Mangle things
  210. dsr::String randomText;
  211. for (int i = 1; i < 100; i++) {
  212. // Randomize previous characters
  213. for (int j = 1; j < i - 1; j++) {
  214. randomText.write(j, (DsrChar)((i * 21 + j * 49 + 136) % 1024));
  215. }
  216. // Add a new random character
  217. randomText.appendChar((i * 21 + 136) % 256);
  218. ASSERT_MATCH(dsr::string_unmangleQuote(dsr::string_mangleQuote(randomText)), randomText);
  219. }
  220. // Number serialization
  221. ASSERT_MATCH(dsr::string_combine(0, U" ", 1), U"0 1");
  222. ASSERT_MATCH(dsr::string_combine(14, U"x", 135), U"14x135");
  223. ASSERT_MATCH(dsr::string_combine(-135), U"-135");
  224. ASSERT_MATCH(dsr::string_combine(-14), U"-14");
  225. ASSERT_MATCH(dsr::string_combine(-1), U"-1");
  226. ASSERT_MATCH(dsr::string_combine(0u), U"0");
  227. ASSERT_MATCH(dsr::string_combine(1u), U"1");
  228. ASSERT_MATCH(dsr::string_combine(14u), U"14");
  229. ASSERT_MATCH(dsr::string_combine(135u), U"135");
  230. // Number parsing
  231. ASSERT_EQUAL(string_toInteger(U"0"), 0);
  232. ASSERT_EQUAL(string_toInteger(U"-0"), 0);
  233. ASSERT_EQUAL(string_toInteger(U"No digits here."), 0);
  234. ASSERT_EQUAL(string_toInteger(U" (12 garbage 34) "), 1234); // You are supposed to catch these errors before converting to an integer
  235. ASSERT_EQUAL(string_toInteger(U""), 0);
  236. ASSERT_EQUAL(string_toInteger(U"1"), 1);
  237. ASSERT_EQUAL(string_toInteger(U"-1"), -1);
  238. ASSERT_EQUAL(string_toInteger(U"1024"), 1024);
  239. ASSERT_EQUAL(string_toInteger(U"-1024"), -1024);
  240. ASSERT_EQUAL(string_toInteger(U"1000000"), 1000000);
  241. ASSERT_EQUAL(string_toInteger(U"-1000000"), -1000000);
  242. ASSERT_EQUAL(string_toInteger(U"123"), 123);
  243. ASSERT_EQUAL(string_toDouble(U"123"), 123.0);
  244. ASSERT_EQUAL(string_toDouble(U"123.456"), 123.456);
  245. { // Splitting
  246. List<ReadableString> result;
  247. string_split_inPlace(result, U"a.b.c.d", U'.');
  248. ASSERT_EQUAL(result.length(), 4);
  249. ASSERT_MATCH(result[0], U"a");
  250. ASSERT_MATCH(result[1], U"b");
  251. ASSERT_MATCH(result[2], U"c");
  252. ASSERT_MATCH(result[3], U"d");
  253. String content = U"One Two Three";
  254. result = string_split(content, U' ');
  255. ASSERT_EQUAL(result.length(), 3);
  256. ASSERT_MATCH(result[0], U"One");
  257. ASSERT_MATCH(result[1], U"Two");
  258. ASSERT_MATCH(result[2], U"Three");
  259. string_split_inPlace(result, U"Four.Five", U'.', true);
  260. ASSERT_EQUAL(result.length(), 5);
  261. ASSERT_MATCH(result[0], U"One");
  262. ASSERT_MATCH(result[1], U"Two");
  263. ASSERT_MATCH(result[2], U"Three");
  264. ASSERT_MATCH(result[3], U"Four");
  265. ASSERT_MATCH(result[4], U"Five");
  266. string_split_inPlace(result, U" 1 | 2 ", U'|');
  267. ASSERT_EQUAL(result.length(), 2);
  268. ASSERT_MATCH(result[0], U" 1 ");
  269. ASSERT_MATCH(result[1], U" 2 ");
  270. }
  271. { // Callback splitting
  272. String numbers = U"1, 3, 5, 7, 9";
  273. List<int> result;
  274. string_split_callback([&numbers, &result](ReadableString section) {
  275. result.push(string_toInteger(section));
  276. }, numbers, U',');
  277. ASSERT_EQUAL(result.length(), 5);
  278. ASSERT_EQUAL(result[0], 1);
  279. ASSERT_EQUAL(result[1], 3);
  280. ASSERT_EQUAL(result[2], 5);
  281. ASSERT_EQUAL(result[3], 7);
  282. ASSERT_EQUAL(result[4], 9);
  283. }
  284. // TODO: Test taking a part of a parent string with a start offset, leaving the parent scope,
  285. // and expanding with append while the buffer isn't shared but has an offset from buffer start.
  286. // TODO: Assert that buffers are shared when they should, but prevents side-effects when one is being written to.
  287. END_TEST