strings.lua 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379
  1. -- $Id: strings.lua,v 1.87 2016/12/21 19:23:02 roberto Exp $
  2. -- See Copyright Notice in file all.lua
  3. print('testing strings and string library')
  -- shorthands for the largest and smallest integers, used further down as
  -- extreme indices and repetition counts
  4. local maxi, mini = math.maxinteger, math.mininteger
  -- Checks that calling 'f' with the given arguments raises an error whose
  -- message matches 'msg'.
  --   msg: Lua pattern looked up (with string.find) in the error message
  --   f:   function that is expected to fail
  --   ...: arguments forwarded to 'f'
  -- Raises an error that names the expected pattern (and the actual error,
  -- if any) when 'f' succeeds or fails with a non-matching message.
  local function checkerror (msg, f, ...)
    local ok, err = pcall(f, ...)
    if ok then
      error(string.format(
        "expected an error matching '%s', but the call succeeded", msg), 2)
    end
    -- error values need not be strings; convert first so that the search
    -- itself cannot raise a confusing type error
    local text = tostring(err)
    if not string.find(text, msg) then
      error(string.format(
        "expected an error matching '%s', got '%s'", msg, text), 2)
    end
  end
  9. -- testing string comparisons
  -- (a proper prefix orders before the longer string, and embedded '\0'
  -- bytes take part in the comparison instead of ending the string)
  10. assert('alo' < 'alo1')
  11. assert('' < 'a')
  12. assert('alo\0alo' < 'alo\0b')
  13. assert('alo\0alo\0\0' > 'alo\0alo\0')
  14. assert('alo' < 'alo\0')
  15. assert('alo\0' > 'alo')
  16. assert('\0' < '\1')
  17. assert('\0\0' < '\0\1')
  -- equal strings satisfy '<=' and '>=' but never '<'
  18. assert('\1\0a\0a' <= '\1\0a\0a')
  19. assert(not ('\1\0a\0b' <= '\1\0a\0a'))
  -- strings made only of zeros are still ordered by length
  20. assert('\0\0\0' < '\0\0\0\0')
  21. assert(not('\0\0\0\0' < '\0\0\0'))
  22. assert('\0\0\0' <= '\0\0\0\0')
  23. assert(not('\0\0\0\0' <= '\0\0\0'))
  24. assert('\0\0\0' <= '\0\0\0')
  25. assert('\0\0\0' >= '\0\0\0')
  26. assert(not ('\0\0b' < '\0\0a\0'))
  27. -- testing string.sub
  -- (positions are 1-based and inclusive; negative positions count from the
  -- end of the string; an empty or inverted range gives "")
  28. assert(string.sub("123456789",2,4) == "234")
  29. assert(string.sub("123456789",7) == "789")
  30. assert(string.sub("123456789",7,6) == "")
  31. assert(string.sub("123456789",7,7) == "7")
  32. assert(string.sub("123456789",0,0) == "")
  -- bounds that fall outside the string are clipped to it
  33. assert(string.sub("123456789",-10,10) == "123456789")
  34. assert(string.sub("123456789",1,9) == "123456789")
  35. assert(string.sub("123456789",-10,-20) == "")
  36. assert(string.sub("123456789",-1) == "9")
  37. assert(string.sub("123456789",-4) == "6789")
  38. assert(string.sub("123456789",-6, -4) == "456")
  -- the extreme integers must be accepted as positions as well
  39. assert(string.sub("123456789", mini, -4) == "123456")
  40. assert(string.sub("123456789", mini, maxi) == "123456789")
  41. assert(string.sub("123456789", mini, mini) == "")
  -- a leading '\0' occupies position 1 like any other character
  42. assert(string.sub("\000123456789",3,5) == "234")
  43. assert(("\000123456789"):sub(8) == "789")
  -- testing string.find
  -- (comparing a call with '==' looks only at its first result, which is the
  -- start position of the match, or nil when there is no match)
  assert(string.find("123456789", "345") == 3)
  -- keep both positions in locals: a bare 'a,b = ...' would silently create
  -- two global variables
  local a, b = string.find("123456789", "345")
  assert(string.sub("123456789", a, b) == "345")
  -- the third argument is the position where the search starts
  assert(string.find("1234567890123456789", "345", 3) == 3)
  assert(string.find("1234567890123456789", "345", 4) == 13)
  assert(string.find("1234567890123456789", "346", 4) == nil)
  assert(string.find("1234567890123456789", ".45", -9) == 13)
  assert(string.find("abcdefg", "\0", 5, 1) == nil)
  -- the empty pattern matches the empty string at position 1 only
  assert(string.find("", "") == 1)
  assert(string.find("", "", 1) == 1)
  assert(not string.find("", "", 2))
  assert(string.find('', 'aaa', 1) == nil)
  -- a true fourth argument turns pattern matching off: '(.)' is literal text
  assert(('alo(.)alo'):find('(.)', 1, 1) == 4)

  -- string.len and the '#' operator both count embedded zeros
  assert(string.len("") == 0)
  assert(string.len("\0\0\0") == 3)
  assert(string.len("1234567890") == 10)

  assert(#"" == 0)
  assert(#"\0\0\0" == 3)
  assert(#"1234567890" == 10)
  64. -- testing string.byte/string.char
  -- (string.byte gives numeric character codes, string.char builds a string
  -- back from such codes)
  65. assert(string.byte("a") == 97)
  66. assert(string.byte("\xe4") > 127)
  67. assert(string.byte(string.char(255)) == 255)
  68. assert(string.byte(string.char(0)) == 0)
  69. assert(string.byte("\0") == 0)
  70. assert(string.byte("\0\0alo\0x", -1) == string.byte('x'))
  71. assert(string.byte("ba", 2) == 97)
  72. assert(string.byte("\n\n", 2, -1) == 10)
  73. assert(string.byte("\n\n", 2, 2) == 10)
  -- positions outside the string, or an inverted range, give no values,
  -- which compares equal to nil
  74. assert(string.byte("") == nil)
  75. assert(string.byte("hi", -3) == nil)
  76. assert(string.byte("hi", 3) == nil)
  77. assert(string.byte("hi", 9, 10) == nil)
  78. assert(string.byte("hi", 2, 1) == nil)
  79. assert(string.char() == "")
  80. assert(string.char(0, 255, 0) == "\0\255\0")
  81. assert(string.char(0, string.byte("\xe4"), 0) == "\0\xe4\0")
  -- byte followed by char must reproduce the string, embedded zero included
  82. assert(string.char(string.byte("\xe4l\0óu", 1, -1)) == "\xe4l\0óu")
  83. assert(string.char(string.byte("\xe4l\0óu", 1, 0)) == "")
  84. assert(string.char(string.byte("\xe4l\0óu", -10, 100)) == "\xe4l\0óu")
  -- case conversion leaves '\0' and non-letters as they are
  85. assert(string.upper("ab\0c") == "AB\0C")
  86. assert(string.lower("\0ABCc%$") == "\0abcc%$")
  -- string.rep without a separator
  87. assert(string.rep('teste', 0) == '')
  88. assert(string.rep('tés\00tê', 2) == 'tés\0têtés\000tê')
  89. assert(string.rep('', 10) == '')
  -- the next two checks run only where string.packsize("i") reports 4
  90. if string.packsize("i") == 4 then
  91. -- result length would be 2^31 (int overflow)
  92. checkerror("too large", string.rep, 'aa', (1 << 30))
  93. checkerror("too large", string.rep, 'a', (1 << 30), ',')
  94. end
  95. -- repetitions with separator
  96. assert(string.rep('teste', 0, 'xuxu') == '')
  97. assert(string.rep('teste', 1, 'xuxu') == 'teste')
  98. assert(string.rep('\1\0\1', 2, '\0\0') == '\1\0\1\0\0\1\0\1')
  -- the separator goes between copies only: 10 empty copies give 9 separators
  99. assert(string.rep('', 10, '.') == string.rep('.', 9))
  -- requests for an impossibly large result must raise an error
  100. assert(not pcall(string.rep, "aa", maxi // 2 + 10))
  101. assert(not pcall(string.rep, "", maxi // 2 + 10, "aa"))
  -- string.reverse, including strings with embedded zeros
  102. assert(string.reverse"" == "")
  103. assert(string.reverse"\0\1\2\3" == "\3\2\1\0")
  104. assert(string.reverse"\0001234" == "4321\0")
  105. for i=0,30 do assert(string.len(string.rep('a', i)) == i) end
  -- tostring: the result is always a string, whatever the argument type
  106. assert(type(tostring(nil)) == 'string')
  107. assert(type(tostring(12)) == 'string')
  108. assert(string.find(tostring{}, 'table:'))
  109. assert(string.find(tostring(print), 'function:'))
  110. assert(#tostring('\0') == 1)
  111. assert(tostring(true) == "true")
  112. assert(tostring(false) == "false")
  113. assert(tostring(-1203) == "-1203")
  114. assert(tostring(1203.125) == "1203.125")
  115. assert(tostring(-0.5) == "-0.5")
  116. assert(tostring(-32767) == "-32767")
  117. if math.tointeger(2147483647) then -- no overflow? (32 bits)
  118. assert(tostring(-2147483647) == "-2147483647")
  119. end
  120. if math.tointeger(4611686018427387904) then -- no overflow? (64 bits)
  121. assert(tostring(4611686018427387904) == "4611686018427387904")
  122. assert(tostring(-4611686018427387904) == "-4611686018427387904")
  123. end
  -- floats with an integral value print either with or without a trailing
  -- ".0"; which set of checks applies is decided by how 0.0 is printed
  124. if tostring(0.0) == "0.0" then -- "standard" coercion float->string
  125. assert('' .. 12 == '12' and 12.0 .. '' == '12.0')
  126. assert(tostring(-1203 + 0.0) == "-1203.0")
  127. else -- compatible coercion
  128. assert(tostring(0.0) == "0")
  129. assert('' .. 12 == '12' and 12.0 .. '' == '12')
  130. assert(tostring(-1203 + 0.0) == "-1203")
  131. end
  -- string.format: '%q' quoting, '%c', '%s' with embedded zeros, widths and
  -- precisions.
  -- 'x' is a scratch value; 'local' keeps it out of the global table
  local x = '"ílo"\n\\'
  assert(string.format('%q%s', x, x) == '"\\"ílo\\"\\\n\\\\""ílo"\n\\')
  assert(string.format('%q', "\0") == [["\0"]])
  -- text produced by '%q' must read back as the original string
  assert(load(string.format('return %q', x))() == x)
  x = "\0\1\0023\5\0009"
  assert(load(string.format('return %q', x))() == x)
  assert(string.format("\0%c\0%c%x\0", string.byte("\xe4"), string.byte("b"), 140) ==
         "\0\xe4\0b8c\0")
  assert(string.format('') == "")
  assert(string.format("%c",34)..string.format("%c",48)..string.format("%c",90)..string.format("%c",100) ==
         string.format("%c%c%c%c", 34, 48, 90, 100))
  assert(string.format("%s\0 is not \0%s", 'not be', 'be') == 'not be\0 is not \0be')
  assert(string.format("%%%d %010d", 10, 23) == "%10 0000000023")
  assert(tonumber(string.format("%f", 10.3)) == 10.3)
  x = string.format('"%-50s"', 'a')
  assert(#x == 52)
  -- '%-50s' left-justifies, so the result starts with the quote, 'a' and then
  -- padding: its first four characters are the quote, 'a' and TWO spaces
  assert(string.sub(x, 1, 4) == '"a  ')
  -- a precision truncates the argument; the trailing ".20s" is literal text
  assert(string.format("-%.20s.20s", string.rep("%", 2000)) ==
         "-"..string.rep("%", 20)..".20s")
  -- a width smaller than the argument never truncates it
  assert(string.format('"-%20s.20s"', string.rep("%", 2000)) ==
         string.format("%q", "-"..string.rep("%", 2000)..".20s"))
  do
    -- Round trip through '%q': format the value, evaluate the resulting text
    -- as Lua source, and demand the same value with the same numeric subtype.
    local function checkQ (v)
      local quoted = string.format("%q", v)
      local chunk = load("return " .. quoted)
      local back = chunk()
      assert(v == back and math.type(v) == math.type(back))
    end

    -- table.pack records the argument count in 'n', so the nil sample is
    -- visited like every other one
    local samples = table.pack(
      "\0\0\1\255\u{234}",
      math.maxinteger,
      math.mininteger,
      math.pi,
      0.1,
      true,
      nil,
      false
    )
    for i = 1, samples.n do
      checkQ(samples[i])
    end

    -- a table cannot be written as a literal, so '%q' must refuse it
    checkerror("no literal", string.format, "%q", {})
  end
  -- a plain '%s' accepts embedded zeros; the same kind of string combined
  -- with a width ('%10s') is expected to be rejected
  169. assert(string.format("\0%s\0", "\0\0\1") == "\0\0\0\1\0")
  170. checkerror("contains zeros", string.format, "%10s", "\0")
  171. -- format x tostring
  -- ('%s' accepts non-string arguments and shows their string form; a
  -- precision cuts that text)
  172. assert(string.format("%s %s", nil, true) == "nil true")
  173. assert(string.format("%s %.4s", false, true) == "false true")
  174. assert(string.format("%.3s %.3s", false, true) == "fal tru")
  175. local m = setmetatable({}, {__tostring = function () return "hello" end,
  176. __name = "hi"})
  177. assert(string.format("%s %.10s", m, m) == "hello hello")
  178. getmetatable(m).__tostring = nil -- will use '__name' from now on
  179. assert(string.format("%.4s", m) == "hi: ")
  -- a '__tostring' metamethod that does not return a string is an error
  180. getmetatable(m).__tostring = function () return {} end
  181. checkerror("'__tostring' must return a string", tostring, m)
  -- integer conversions: a float with an integral value is accepted by '%x';
  -- the '0' and '+' flags pad with zeros and force a sign
  182. assert(string.format("%x", 0.0) == "0")
  183. assert(string.format("%02x", 0.0) == "00")
  184. assert(string.format("%08X", 0xFFFFFFFF) == "FFFFFFFF")
  185. assert(string.format("%+08d", 31501) == "+0031501")
  186. assert(string.format("%+08d", -30927) == "-0030927")
  do   -- longest number that can be formatted
    -- Binary search for the largest exponent 'lo' for which 10^lo is still
    -- finite; 'hi' is kept as an exponent that already overflows.
    local lo, hi = 1, 10000
    while lo + 1 < hi do
      local mid = (lo + hi) // 2
      if 10^mid < math.huge then
        lo = mid
      else
        hi = mid
      end
    end
    assert(10^lo < math.huge and 10^hi == math.huge)

    -- format the negated maximum with 99 decimals and read it back
    local extreme = -(10^lo)
    local text = string.format('%.99f', extreme)
    assert(string.len(text) >= lo + 101)
    assert(tonumber(text) == extreme)
  end
  199. -- testing large numbers for format
  200. do -- assume at least 32 bits
  201. local max, min = 0x7fffffff, -0x80000000 -- "large" for 32 bits
  -- only the last 8 hexadecimal digits are compared for negative values, so
  -- the checks do not depend on how many digits the full result has
  202. assert(string.sub(string.format("%8x", -1), -8) == "ffffffff")
  203. assert(string.format("%x", max) == "7fffffff")
  204. assert(string.sub(string.format("%x", min), -8) == "80000000")
  205. assert(string.format("%d", max) == "2147483647")
  206. assert(string.format("%d", min) == "-2147483648")
  207. assert(string.format("%u", 0xffffffff) == "4294967295")
  208. assert(string.format("%o", 0xABCD) == "125715")
  -- same checks with the 64-bit limits, run only when 'max' exceeds 2^53
  209. max, min = 0x7fffffffffffffff, -0x8000000000000000
  210. if max > 2.0^53 then -- only for 64 bits
  211. assert(string.format("%x", (2^52 | 0) - 1) == "fffffffffffff")
  212. assert(string.format("0x%8X", 0x8f000003) == "0x8F000003")
  -- floats with an exact integer value are accepted by '%d' and '%i'
  213. assert(string.format("%d", 2^53) == "9007199254740992")
  214. assert(string.format("%i", -2^53) == "-9007199254740992")
  215. assert(string.format("%x", max) == "7fffffffffffffff")
  216. assert(string.format("%x", min) == "8000000000000000")
  217. assert(string.format("%d", max) == "9223372036854775807")
  218. assert(string.format("%d", min) == "-9223372036854775808")
  219. assert(string.format("%u", ~(-1 << 64)) == "18446744073709551615")
  220. assert(tostring(1234567890123) == '1234567890123')
  221. end
  222. end
  do print("testing 'format %a %A'")

    -- Formats 'n' with both hexadecimal-float conversions and checks that
    -- each result has the expected shape and converts back to exactly 'n'.
    local function matchhexa (n)
      local lower = string.format("%a", n)
      -- result matches ISO C requirements
      assert(string.find(lower, "^%-?0x[1-9a-f]%.?[0-9a-f]*p[-+]?%d+$"))
      -- and has full precision
      assert(tonumber(lower) == n)

      local upper = string.format("%A", n)
      assert(string.find(upper, "^%-?0X[1-9A-F]%.?[0-9A-F]*P[-+]?%d+$"))
      assert(tonumber(upper) == n)
    end

    local samples = {0.1, -0.1, 1/3, -1/3, 1e30, -1e30,
                     -45/247, 1, -1, 2, -2, 3e-20, -3e-20}
    for i = 1, #samples do
      matchhexa(samples[i])
    end

    -- zero has its own shape, with a leading 0 digit
    assert(string.find(string.format("%A", 0.0), "^0X0%.?0*P%+?0$"))
    assert(string.find(string.format("%a", -0.0), "^%-0x0%.?0*p%+?0$"))

    if not _port then   -- test inf, -inf, NaN, and -0.0
      assert(string.find(string.format("%a", 1/0), "^inf"))
      assert(string.find(string.format("%A", -1/0), "^%-INF"))
      assert(string.find(string.format("%a", 0/0), "^%-?nan"))
      assert(string.find(string.format("%a", -0.0), "^%-0x0"))
    end

    -- flags and precision with '%a' are checked only when they are accepted
    if pcall(string.format, "%.3a", 0) then
      assert(string.find(string.format("%+.2A", 12), "^%+0X%x%.%x0P%+?%d$"))
      assert(string.find(string.format("%.4A", -12), "^%-0X%x%.%x000P%+?%d$"))
    else
      local report = Message or print
      report("\n >>> modifiers for format '%a' not available <<<\n")
    end
  end
  -- errors in format

  -- Expects string.format to reject format 'fmt' with an error message that
  -- matches 'msg'; the value 10 is always passed as the only argument.
  local function check (fmt, msg)
    checkerror(msg, string.format, fmt, 10)
  end

  -- long run of zeros used to build oversized widths and precisions
  local aux = string.rep('0', 600)

  -- each entry: { format, pattern expected in the error message }
  local badformats = {
    {"%100.3d", "too long"},
    {"%1"..aux..".3d", "too long"},
    {"%1.100d", "too long"},
    {"%10.1"..aux.."004d", "too long"},
    {"%t", "invalid option"},
    {"%"..aux.."d", "repeated flags"},
    {"%d %d", "no value"},
  }
  for i = 1, #badformats do
    check(badformats[i][1], badformats[i][2])
  end
  -- a chunk may end inside a comment that has no final end-of-line
  264. assert(load("return 1\n--comment without ending EOL")() == 1)
  -- table.concat: argument checking, separators and index ranges
  265. checkerror("table expected", table.concat, 3)
  266. assert(table.concat{} == "")
  267. assert(table.concat({}, 'x') == "")
  268. assert(table.concat({'\0', '\0\1', '\0\1\2'}, '.\0.') == "\0.\0.\0\1.\0.\0\1\2")
  269. local a = {}; for i=1,300 do a[i] = "xuxu" end
  270. assert(table.concat(a, "123").."123" == string.rep("xuxu123", 300))
  271. assert(table.concat(a, "b", 20, 20) == "xuxu")
  272. assert(table.concat(a, "", 20, 21) == "xuxuxuxu")
  273. assert(table.concat(a, "x", 22, 21) == "")
  274. assert(table.concat(a, "3", 299) == "xuxu3xuxu")
  -- ranges at the integer limits: empty ranges give "", and a range ending
  -- at the largest integer must still work
  275. assert(table.concat({}, "x", maxi, maxi - 1) == "")
  276. assert(table.concat({}, "x", mini + 1, mini) == "")
  277. assert(table.concat({}, "x", maxi, mini) == "")
  278. assert(table.concat({[maxi] = "alo"}, "x", maxi, maxi) == "alo")
  279. assert(table.concat({[maxi] = "alo", [maxi - 1] = "y"}, "-", maxi - 1, maxi)
  280. == "y-alo")
  -- an element that is a table makes the call fail
  281. assert(not pcall(table.concat, {"a", "b", {}}))
  282. a = {"a","b","c"}
  283. assert(table.concat(a, ",", 1, 0) == "")
  284. assert(table.concat(a, ",", 1, 1) == "a")
  285. assert(table.concat(a, ",", 1, 2) == "a,b")
  286. assert(table.concat(a, ",", 2) == "b,c")
  287. assert(table.concat(a, ",", 3) == "c")
  288. assert(table.concat(a, ",", 4) == "")
  -- Locale-dependent checks, skipped when '_port' is set.
  -- The accented test strings are spelled with '\xXX' escapes giving their
  -- ISO-8859-1 codes, so each letter is exactly one byte no matter which
  -- encoding this source file is stored in.
  if not _port then

    -- candidate names for a Portuguese / Latin-1 locale
    local locales = { "ptb", "pt_BR.iso88591", "ISO-8859-1" }

    -- Tries each candidate name for locale category 'w' and reports the
    -- outcome. Returns the first name accepted by os.setlocale, or false
    -- when none is accepted.
    local function trylocale (w)
      for i = 1, #locales do
        if os.setlocale(locales[i], w) then
          print(string.format("'%s' locale set to '%s'", w, locales[i]))
          return locales[i]
        end
      end
      print(string.format("'%s' locale not found", w))
      return false
    end

    if trylocale("collate") then
      -- "alo" < "álo" < "amo"
      assert("alo" < "\xe1lo" and "\xe1lo" < "amo")
    end

    if trylocale("ctype") then
      -- "áéíóú": every accented vowel counts as a letter
      assert(string.gsub("\xe1\xe9\xed\xf3\xfa", "%a", "x") == "xxxxx")
      -- "áÁéÉ": only the lower-case letters are replaced
      assert(string.gsub("\xe1\xc1\xe9\xc9", "%l", "x") == "x\xc1x\xc9")
      -- "áÁéÉ": only the upper-case letters are replaced
      assert(string.gsub("\xe1\xc1\xe9\xc9", "%u", "x") == "\xe1x\xe9x")
      -- "áÁé{xuxu}ção" -> "ÁÁÉ{XUXU}ÇÃO"
      assert(string.upper"\xe1\xc1\xe9{xuxu}\xe7\xe3o" ==
             "\xc1\xc1\xc9{XUXU}\xc7\xc3O")
    end

    -- go back to the "C" locale so that later code is not affected
    os.setlocale("C")
    assert(os.setlocale() == 'C')
    assert(os.setlocale(nil, "numeric") == 'C')

  end
  -- bug in Lua 5.3.2
  -- 'gmatch' iterator does not work across coroutines
  do
    local f = string.gmatch("1 2 3 4 5", "%d+")
    -- the first match is taken here ...
    assert(f() == "1")
    -- ... and the next one from inside a coroutine; 'local' keeps the
    -- wrapped iterator from leaking out as a global named 'co'
    local co = coroutine.wrap(f)
    assert(co() == "2")
  end
  -- reached only when none of the assertions above has failed
  322. print('OK')