dump.lua 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634
  1. ----------------------------------------------------------------------------
  2. -- LuaJIT compiler dump module.
  3. --
  4. -- Copyright (C) 2005-2010 Mike Pall. All rights reserved.
  5. -- Released under the MIT/X license. See Copyright Notice in luajit.h
  6. ----------------------------------------------------------------------------
  7. --
  8. -- This module can be used to debug the JIT compiler itself. It dumps the
  9. -- code representations and structures used in various compiler stages.
  10. --
  11. -- Example usage:
  12. --
  13. -- luajit -jdump -e "local x=0; for i=1,1e6 do x=x+i end; print(x)"
  14. -- luajit -jdump=im -e "for i=1,1000 do for j=1,1000 do end end" | less -R
  15. -- luajit -jdump=is myapp.lua | less -R
  16. -- luajit -jdump=-b myapp.lua
  17. -- luajit -jdump=+aH,myapp.html myapp.lua
  18. -- luajit -jdump=ixT,myapp.dump myapp.lua
  19. --
  20. -- The first argument specifies the dump mode. The second argument gives
  21. -- the output file name. Default output is to stdout, unless the environment
  22. -- variable LUAJIT_DUMPFILE is set. The file is overwritten every time the
  23. -- module is started.
  24. --
  25. -- Different features can be turned on or off with the dump mode. If the
  26. -- mode starts with a '+', the following features are added to the default
  27. -- set of features; a '-' removes them. Otherwise the features are replaced.
  28. --
  29. -- The following dump features are available (* marks the default):
  30. --
  31. -- * t Print a line for each started, ended or aborted trace (see also -jv).
  32. -- * b Dump the traced bytecode.
  33. -- * i Dump the IR (intermediate representation).
  34. -- r Augment the IR with register/stack slots.
  35. -- s Dump the snapshot map.
  36. -- * m Dump the generated machine code.
  37. -- x Print each taken trace exit.
-- X Print each taken trace exit and the contents of all registers.
-- a Dump the IR, snapshots and machine code (as selected by i, s and m) of aborted traces, too.
  39. --
  40. -- The output format can be set with the following characters:
  41. --
  42. -- T Plain text output.
  43. -- A ANSI-colored text output
  44. -- H Colorized HTML + CSS output.
  45. --
  46. -- The default output format is plain text. It's set to ANSI-colored text
  47. -- if the COLORTERM variable is set. Note: this is independent of any output
  48. -- redirection, which is actually considered a feature.
  49. --
  50. -- You probably want to use less -R to enjoy viewing ANSI-colored text from
  51. -- a pipe or a file. Add this to your ~/.bashrc: export LESS="-R"
  52. --
  53. ------------------------------------------------------------------------------
  54. -- Cache some library functions and objects.
  55. local jit = require("jit")
  56. assert(jit.version_num == 20000, "LuaJIT core/library version mismatch")
  57. local jutil = require("jit.util")
  58. local vmdef = require("jit.vmdef")
  59. local funcinfo, funcbc = jutil.funcinfo, jutil.funcbc
  60. local traceinfo, traceir, tracek = jutil.traceinfo, jutil.traceir, jutil.tracek
  61. local tracemc, tracesnap = jutil.tracemc, jutil.tracesnap
  62. local traceexitstub, ircalladdr = jutil.traceexitstub, jutil.ircalladdr
  63. local bit = require("bit")
  64. local band, shl, shr = bit.band, bit.lshift, bit.rshift
  65. local sub, gsub, format = string.sub, string.gsub, string.format
  66. local byte, char, rep = string.byte, string.char, string.rep
  67. local type, tostring = type, tostring
  68. local stdout, stderr = io.stdout, io.stderr
  69. -- Load other modules on-demand.
  70. local bcline, discreate
  71. -- Active flag, output file handle and dump mode.
  72. local active, out, dumpmode
  73. ------------------------------------------------------------------------------
  74. local symtab = {}
  75. local nexitsym = 0
  76. -- Fill symbol table with trace exit addresses.
  77. local function fillsymtab(nexit)
  78. local t = symtab
  79. if nexitsym == 0 then
  80. local ircall = vmdef.ircall
  81. for i=0,#ircall do t[ircalladdr(i)] = ircall[i] end
  82. end
  83. if nexit > nexitsym then
  84. for i=nexitsym,nexit-1 do t[traceexitstub(i)] = tostring(i) end
  85. nexitsym = nexit
  86. end
  87. return t
  88. end
-- Output callback passed to the disassembler by dump_mcode: forwards the
-- given text to the current output file handle.
local function dumpwrite(s)
  out:write(s)
end
  92. -- Disassemble machine code.
  93. local function dump_mcode(tr)
  94. local info = traceinfo(tr)
  95. if not info then return end
  96. local mcode, addr, loop = tracemc(tr)
  97. if not mcode then return end
  98. if not discreate then
  99. discreate = require("jit.dis_"..jit.arch).create
  100. end
  101. out:write("---- TRACE ", tr, " mcode ", #mcode, "\n")
  102. local ctx = discreate(mcode, addr, dumpwrite)
  103. ctx.hexdump = 0
  104. ctx.symtab = fillsymtab(info.nexit)
  105. if loop ~= 0 then
  106. symtab[addr+loop] = "LOOP"
  107. ctx:disass(0, loop)
  108. out:write("->LOOP:\n")
  109. ctx:disass(loop, #mcode-loop)
  110. symtab[addr+loop] = nil
  111. else
  112. ctx:disass(0, #mcode)
  113. end
  114. end
  115. ------------------------------------------------------------------------------
  116. local irtype_text = {
  117. [0] = "nil",
  118. "fal",
  119. "tru",
  120. "lud",
  121. "str",
  122. "p32",
  123. "thr",
  124. "pro",
  125. "fun",
  126. "p64",
  127. "cdt",
  128. "tab",
  129. "udt",
  130. "flt",
  131. "num",
  132. "i8 ",
  133. "u8 ",
  134. "i16",
  135. "u16",
  136. "int",
  137. "u32",
  138. "i64",
  139. "u64",
  140. }
  141. local colortype_ansi = {
  142. [0] = "%s",
  143. "%s",
  144. "%s",
  145. "\027[36m%s\027[m",
  146. "\027[32m%s\027[m",
  147. "%s",
  148. "\027[1m%s\027[m",
  149. "%s",
  150. "\027[1m%s\027[m",
  151. "%s",
  152. "\027[33m%s\027[m",
  153. "\027[31m%s\027[m",
  154. "\027[36m%s\027[m",
  155. "\027[34m%s\027[m",
  156. "\027[34m%s\027[m",
  157. "\027[35m%s\027[m",
  158. "\027[35m%s\027[m",
  159. "\027[35m%s\027[m",
  160. "\027[35m%s\027[m",
  161. "\027[35m%s\027[m",
  162. "\027[35m%s\027[m",
  163. "\027[35m%s\027[m",
  164. "\027[35m%s\027[m",
  165. }
-- Colorizer for plain text output: returns s unchanged and ignores the
-- IR type t.
local function colorize_text(s, t)
  return s
end
-- Colorizer for ANSI output: formats s with the template that
-- colortype_ansi holds for IR type t.
local function colorize_ansi(s, t)
  return format(colortype_ansi[t], s)
end
  172. local irtype_ansi = setmetatable({},
  173. { __index = function(tab, t)
  174. local s = colorize_ansi(irtype_text[t], t); tab[t] = s; return s; end })
  175. local html_escape = { ["<"] = "&lt;", [">"] = "&gt;", ["&"] = "&amp;", }
  176. local function colorize_html(s, t)
  177. s = gsub(s, "[<>&]", html_escape)
  178. return format('<span class="irt_%s">%s</span>', irtype_text[t], s)
  179. end
  180. local irtype_html = setmetatable({},
  181. { __index = function(tab, t)
  182. local s = colorize_html(irtype_text[t], t); tab[t] = s; return s; end })
  183. local header_html = [[
  184. <style type="text/css">
  185. background { background: #ffffff; color: #000000; }
  186. pre.ljdump {
  187. font-size: 10pt;
  188. background: #f0f4ff;
  189. color: #000000;
  190. border: 1px solid #bfcfff;
  191. padding: 0.5em;
  192. margin-left: 2em;
  193. margin-right: 2em;
  194. }
  195. span.irt_str { color: #00a000; }
  196. span.irt_thr, span.irt_fun { color: #404040; font-weight: bold; }
  197. span.irt_tab { color: #c00000; }
  198. span.irt_udt, span.irt_lud { color: #00c0c0; }
  199. span.irt_num { color: #4040c0; }
  200. span.irt_int, span.irt_i8, span.irt_u8, span.irt_i16, span.irt_u16 { color: #b040b0; }
  201. </style>
  202. ]]
  203. local colorize, irtype
  204. -- Lookup tables to convert some literals into names.
  205. local tointname = { [0] = "check", "index", "", "Z", "S", "T", }
  206. local litname = {
  207. ["SLOAD "] = setmetatable({}, { __index = function(t, mode)
  208. local s = ""
  209. if band(mode, 1) ~= 0 then s = s.."P" end
  210. if band(mode, 2) ~= 0 then s = s.."F" end
  211. if band(mode, 4) ~= 0 then s = s.."T" end
  212. if band(mode, 8) ~= 0 then s = s.."C" end
  213. if band(mode, 16) ~= 0 then s = s.."R" end
  214. if band(mode, 32) ~= 0 then s = s.."I" end
  215. t[mode] = s
  216. return s
  217. end}),
  218. ["XLOAD "] = { [0] = "", "R", "U", "RU", },
  219. ["TOINT "] = tointname,
  220. ["TOI64 "] = tointname,
  221. ["FLOAD "] = vmdef.irfield,
  222. ["FREF "] = vmdef.irfield,
  223. ["FPMATH"] = vmdef.irfpm,
  224. }
  225. local function ctlsub(c)
  226. if c == "\n" then return "\\n"
  227. elseif c == "\r" then return "\\r"
  228. elseif c == "\t" then return "\\t"
  229. elseif c == "\r" then return "\\r"
  230. else return format("\\%03d", byte(c))
  231. end
  232. end
  233. local function fmtfunc(func, pc)
  234. local fi = funcinfo(func, pc)
  235. if fi.loc then
  236. return fi.loc
  237. elseif fi.ffid then
  238. return vmdef.ffnames[fi.ffid]
  239. elseif fi.addr then
  240. return format("C:%x", fi.addr)
  241. else
  242. return "(?)"
  243. end
  244. end
  245. local function formatk(tr, idx)
  246. local k, t, slot = tracek(tr, idx)
  247. local tn = type(k)
  248. local s
  249. if tn == "number" then
  250. if k == 2^52+2^51 then
  251. s = "bias"
  252. else
  253. s = format("%+.14g", k)
  254. end
  255. elseif tn == "string" then
  256. s = format(#k > 20 and '"%.20s"~' or '"%s"', gsub(k, "%c", ctlsub))
  257. elseif tn == "function" then
  258. s = fmtfunc(k)
  259. elseif tn == "table" then
  260. s = format("{%p}", k)
  261. elseif tn == "userdata" then
  262. if t == 12 then
  263. s = format("userdata:%p", k)
  264. else
  265. s = format("[%p]", k)
  266. if s == "[0x00000000]" then s = "NULL" end
  267. end
  268. else
  269. s = tostring(k) -- For primitives.
  270. end
  271. s = colorize(format("%-4s", s), t)
  272. if slot then
  273. s = format("%s @%d", s, slot)
  274. end
  275. return s
  276. end
  277. local function printsnap(tr, snap)
  278. local n = 2
  279. for s=0,snap[1]-1 do
  280. local sn = snap[n]
  281. if shr(sn, 24) == s then
  282. n = n + 1
  283. local ref = band(sn, 0xffff) - 0x8000 -- REF_BIAS
  284. if ref < 0 then
  285. out:write(formatk(tr, ref))
  286. else
  287. local m, ot, op1, op2 = traceir(tr, ref)
  288. out:write(colorize(format("%04d", ref), band(ot, 31)))
  289. end
  290. out:write(band(sn, 0x10000) == 0 and " " or "|") -- SNAP_FRAME
  291. else
  292. out:write("---- ")
  293. end
  294. end
  295. out:write("]\n")
  296. end
  297. -- Dump snapshots (not interleaved with IR).
  298. local function dump_snap(tr)
  299. out:write("---- TRACE ", tr, " snapshots\n")
  300. for i=0,1000000000 do
  301. local snap = tracesnap(tr, i)
  302. if not snap then break end
  303. out:write(format("#%-3d %04d [ ", i, snap[0]))
  304. printsnap(tr, snap)
  305. end
  306. end
  307. -- NYI: should really get the register map from the disassembler.
  308. local reg_map = ({
  309. x86 = {
  310. [0] = "eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi",
  311. "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7",
  312. },
  313. x64 = {
  314. [0] = "rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi",
  315. "r8", "r9", "r10", "r11", "r12", "r13", "r14", "r15",
  316. "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7",
  317. "xmm8", "xmm9", "xmm10", "xmm11", "xmm12", "xmm13", "xmm14", "xmm15",
  318. }
  319. })[jit.arch]
  320. -- Return a register name or stack slot for a rid/sp location.
  321. local function ridsp_name(ridsp)
  322. local rid = band(ridsp, 0xff)
  323. if ridsp > 255 then return format("[%x]", shr(ridsp, 8)*4) end
  324. if rid < 128 then return reg_map[rid] end
  325. return ""
  326. end
  327. -- Recursively gather CALL* args and dump them.
  328. local function dumpcallargs(tr, ins)
  329. if ins < 0 then
  330. out:write(formatk(tr, ins))
  331. else
  332. local m, ot, op1, op2 = traceir(tr, ins)
  333. local oidx = 6*shr(ot, 8)
  334. local op = sub(vmdef.irnames, oidx+1, oidx+6)
  335. if op == "CARG " then
  336. dumpcallargs(tr, op1)
  337. if op2 < 0 then
  338. out:write(" ", formatk(tr, op2))
  339. else
  340. out:write(" ", format("%04d", op2))
  341. end
  342. else
  343. out:write(format("%04d", ins))
  344. end
  345. end
  346. end
  347. -- Dump IR and interleaved snapshots.
  348. local function dump_ir(tr, dumpsnap, dumpreg)
  349. local info = traceinfo(tr)
  350. if not info then return end
  351. local nins = info.nins
  352. out:write("---- TRACE ", tr, " IR\n")
  353. local irnames = vmdef.irnames
  354. local snapref = 65536
  355. local snap, snapno
  356. if dumpsnap then
  357. snap = tracesnap(tr, 0)
  358. snapref = snap[0]
  359. snapno = 0
  360. end
  361. for ins=1,nins do
  362. if ins >= snapref then
  363. if dumpreg then
  364. out:write(format(".... SNAP #%-3d [ ", snapno))
  365. else
  366. out:write(format(".... SNAP #%-3d [ ", snapno))
  367. end
  368. printsnap(tr, snap)
  369. snapno = snapno + 1
  370. snap = tracesnap(tr, snapno)
  371. snapref = snap and snap[0] or 65536
  372. end
  373. local m, ot, op1, op2, ridsp = traceir(tr, ins)
  374. local oidx, t = 6*shr(ot, 8), band(ot, 31)
  375. local op = sub(irnames, oidx+1, oidx+6)
  376. if op == "LOOP " then
  377. if dumpreg then
  378. out:write(format("%04d ------------ LOOP ------------\n", ins))
  379. else
  380. out:write(format("%04d ------ LOOP ------------\n", ins))
  381. end
  382. elseif op ~= "NOP " and op ~= "CARG " and
  383. (dumpreg or op ~= "RENAME") then
  384. if dumpreg then
  385. out:write(format("%04d %-5s ", ins, ridsp_name(ridsp)))
  386. else
  387. out:write(format("%04d ", ins))
  388. end
  389. out:write(format("%s%s %s %s ",
  390. band(ot, 128) == 0 and " " or ">",
  391. band(ot, 64) == 0 and " " or "+",
  392. irtype[t], op))
  393. local m1 = band(m, 3)
  394. if sub(op, 1, 4) == "CALL" then
  395. out:write(format("%-10s (", vmdef.ircall[op2]))
  396. if op1 ~= -1 then dumpcallargs(tr, op1) end
  397. out:write(")")
  398. elseif op == "CNEW " and op2 == -1 then
  399. out:write(formatk(tr, op1))
  400. elseif m1 ~= 3 then -- op1 != IRMnone
  401. if op1 < 0 then
  402. out:write(formatk(tr, op1))
  403. else
  404. out:write(format(m1 == 0 and "%04d" or "#%-3d", op1))
  405. end
  406. local m2 = band(m, 3*4)
  407. if m2 ~= 3*4 then -- op2 != IRMnone
  408. if m2 == 1*4 then -- op2 == IRMlit
  409. local litn = litname[op]
  410. if litn and litn[op2] then
  411. out:write(" ", litn[op2])
  412. elseif op == "UREFO " or op == "UREFC " then
  413. out:write(format(" #%-3d", shr(op2, 8)))
  414. else
  415. out:write(format(" #%-3d", op2))
  416. end
  417. elseif op2 < 0 then
  418. out:write(" ", formatk(tr, op2))
  419. else
  420. out:write(format(" %04d", op2))
  421. end
  422. end
  423. end
  424. out:write("\n")
  425. end
  426. end
  427. if snap then
  428. if dumpreg then
  429. out:write(format(".... SNAP #%-3d [ ", snapno))
  430. else
  431. out:write(format(".... SNAP #%-3d [ ", snapno))
  432. end
  433. printsnap(tr, snap)
  434. end
  435. end
  436. ------------------------------------------------------------------------------
  437. local recprefix = ""
  438. local recdepth = 0
  439. -- Format trace error message.
  440. local function fmterr(err, info)
  441. if type(err) == "number" then
  442. if type(info) == "function" then info = fmtfunc(info) end
  443. err = format(vmdef.traceerr[err], info)
  444. end
  445. return err
  446. end
  447. -- Dump trace states.
  448. local function dump_trace(what, tr, func, pc, otr, oex)
  449. if what == "stop" or (what == "abort" and dumpmode.a) then
  450. if dumpmode.i then dump_ir(tr, dumpmode.s, dumpmode.r and what == "stop")
  451. elseif dumpmode.s then dump_snap(tr) end
  452. if dumpmode.m then dump_mcode(tr) end
  453. end
  454. if what == "start" then
  455. if dumpmode.H then out:write('<pre class="ljdump">\n') end
  456. out:write("---- TRACE ", tr, " ", what)
  457. if otr then out:write(" ", otr, "/", oex) end
  458. out:write(" ", fmtfunc(func, pc), "\n")
  459. recprefix = ""
  460. elseif what == "stop" or what == "abort" then
  461. out:write("---- TRACE ", tr, " ", what)
  462. recprefix = nil
  463. if what == "abort" then
  464. out:write(" ", fmtfunc(func, pc), " -- ", fmterr(otr, oex), "\n")
  465. else
  466. local link = traceinfo(tr).link
  467. if link == tr then
  468. link = "loop"
  469. elseif link == 0 then
  470. link = "interpreter"
  471. end
  472. out:write(" -> ", link, "\n")
  473. end
  474. if dumpmode.H then out:write("</pre>\n\n") else out:write("\n") end
  475. else
  476. out:write("---- TRACE ", what, "\n\n")
  477. end
  478. out:flush()
  479. end
  480. -- Dump recorded bytecode.
  481. local function dump_record(tr, func, pc, depth, callee)
  482. if depth ~= recdepth then
  483. recdepth = depth
  484. recprefix = rep(" .", depth)
  485. end
  486. local line
  487. if pc >= 0 then
  488. line = bcline(func, pc, recprefix)
  489. if dumpmode.H then line = gsub(line, "[<>&]", html_escape) end
  490. else
  491. line = "0000 "..recprefix.." FUNCC \n"
  492. callee = func
  493. end
  494. if pc <= 0 then
  495. out:write(sub(line, 1, -2), " ; ", fmtfunc(func), "\n")
  496. else
  497. out:write(line)
  498. end
  499. if pc >= 0 and band(funcbc(func, pc), 0xff) < 16 then -- ORDER BC
  500. out:write(bcline(func, pc+1, recprefix)) -- Write JMP for cond.
  501. end
  502. end
  503. ------------------------------------------------------------------------------
  504. -- Dump taken trace exits.
  505. local function dump_texit(tr, ex, ngpr, nfpr, ...)
  506. out:write("---- TRACE ", tr, " exit ", ex, "\n")
  507. if dumpmode.X then
  508. local regs = {...}
  509. if jit.arch == "x64" then
  510. for i=1,ngpr do
  511. out:write(format(" %016x", regs[i]))
  512. if i % 4 == 0 then out:write("\n") end
  513. end
  514. else
  515. for i=1,ngpr do
  516. out:write(format(" %08x", regs[i]))
  517. if i % 8 == 0 then out:write("\n") end
  518. end
  519. end
  520. for i=1,nfpr do
  521. out:write(format(" %+17.14g", regs[ngpr+i]))
  522. if i % 4 == 0 then out:write("\n") end
  523. end
  524. end
  525. end
  526. ------------------------------------------------------------------------------
  527. -- Detach dump handlers.
  528. local function dumpoff()
  529. if active then
  530. active = false
  531. jit.attach(dump_texit)
  532. jit.attach(dump_record)
  533. jit.attach(dump_trace)
  534. if out and out ~= stdout and out ~= stderr then out:close() end
  535. out = nil
  536. end
  537. end
  538. -- Open the output file and attach dump handlers.
  539. local function dumpon(opt, outfile)
  540. if active then dumpoff() end
  541. local colormode = os.getenv("COLORTERM") and "A" or "T"
  542. if opt then
  543. opt = gsub(opt, "[TAH]", function(mode) colormode = mode; return ""; end)
  544. end
  545. local m = { t=true, b=true, i=true, m=true, }
  546. if opt and opt ~= "" then
  547. local o = sub(opt, 1, 1)
  548. if o ~= "+" and o ~= "-" then m = {} end
  549. for i=1,#opt do m[sub(opt, i, i)] = (o ~= "-") end
  550. end
  551. dumpmode = m
  552. if m.t or m.b or m.i or m.s or m.m then
  553. jit.attach(dump_trace, "trace")
  554. end
  555. if m.b then
  556. jit.attach(dump_record, "record")
  557. if not bcline then bcline = require("jit.bc").line end
  558. end
  559. if m.x or m.X then
  560. jit.attach(dump_texit, "texit")
  561. end
  562. if not outfile then outfile = os.getenv("LUAJIT_DUMPFILE") end
  563. if outfile then
  564. out = outfile == "-" and stdout or assert(io.open(outfile, "w"))
  565. else
  566. out = stdout
  567. end
  568. m[colormode] = true
  569. if colormode == "A" then
  570. colorize = colorize_ansi
  571. irtype = irtype_ansi
  572. elseif colormode == "H" then
  573. colorize = colorize_html
  574. irtype = irtype_html
  575. out:write(header_html)
  576. else
  577. colorize = colorize_text
  578. irtype = irtype_text
  579. end
  580. active = true
  581. end
-- Public module functions.
-- module(...) creates the module table under the name this chunk receives
-- as its argument and makes that table the environment of the chunk. The
-- plain assignments below therefore define fields of the module and have to
-- come after the call.
module(...)
on = dumpon
off = dumpoff
start = dumpon -- For -j command line option.