lj_emit_mips.h 8.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310
  1. /*
  2. ** MIPS instruction emitter.
  3. ** Copyright (C) 2005-2023 Mike Pall. See Copyright Notice in luajit.h
  4. */
  5. #if LJ_64
  6. static intptr_t get_k64val(ASMState *as, IRRef ref)
  7. {
  8. IRIns *ir = IR(ref);
  9. if (ir->o == IR_KINT64) {
  10. return (intptr_t)ir_kint64(ir)->u64;
  11. } else if (ir->o == IR_KGC) {
  12. return (intptr_t)ir_kgc(ir);
  13. } else if (ir->o == IR_KPTR || ir->o == IR_KKPTR) {
  14. return (intptr_t)ir_kptr(ir);
  15. } else if (LJ_SOFTFP && ir->o == IR_KNUM) {
  16. return (intptr_t)ir_knum(ir)->u64;
  17. } else {
  18. lj_assertA(ir->o == IR_KINT || ir->o == IR_KNULL,
  19. "bad 64 bit const IR op %d", ir->o);
  20. return ir->i; /* Sign-extended. */
  21. }
  22. }
  23. #endif
  24. #if LJ_64
  25. #define get_kval(as, ref) get_k64val(as, ref)
  26. #else
  27. #define get_kval(as, ref) (IR((ref))->i)
  28. #endif
  29. /* -- Emit basic instructions --------------------------------------------- */
  30. static void emit_dst(ASMState *as, MIPSIns mi, Reg rd, Reg rs, Reg rt)
  31. {
  32. *--as->mcp = mi | MIPSF_D(rd) | MIPSF_S(rs) | MIPSF_T(rt);
  33. }
  34. static void emit_dta(ASMState *as, MIPSIns mi, Reg rd, Reg rt, uint32_t a)
  35. {
  36. *--as->mcp = mi | MIPSF_D(rd) | MIPSF_T(rt) | MIPSF_A(a);
  37. }
  38. #define emit_ds(as, mi, rd, rs) emit_dst(as, (mi), (rd), (rs), 0)
  39. #define emit_tg(as, mi, rt, rg) emit_dst(as, (mi), (rg)&31, 0, (rt))
  40. static void emit_tsi(ASMState *as, MIPSIns mi, Reg rt, Reg rs, int32_t i)
  41. {
  42. *--as->mcp = mi | MIPSF_T(rt) | MIPSF_S(rs) | (i & 0xffff);
  43. }
  44. #define emit_ti(as, mi, rt, i) emit_tsi(as, (mi), (rt), 0, (i))
  45. #define emit_hsi(as, mi, rh, rs, i) emit_tsi(as, (mi), (rh) & 31, (rs), (i))
  46. static void emit_fgh(ASMState *as, MIPSIns mi, Reg rf, Reg rg, Reg rh)
  47. {
  48. *--as->mcp = mi | MIPSF_F(rf&31) | MIPSF_G(rg&31) | MIPSF_H(rh&31);
  49. }
  50. #define emit_fg(as, mi, rf, rg) emit_fgh(as, (mi), (rf), (rg), 0)
  51. static void emit_rotr(ASMState *as, Reg dest, Reg src, Reg tmp, uint32_t shift)
  52. {
  53. if (LJ_64 || (as->flags & JIT_F_MIPSXXR2)) {
  54. emit_dta(as, MIPSI_ROTR, dest, src, shift);
  55. } else {
  56. emit_dst(as, MIPSI_OR, dest, dest, tmp);
  57. emit_dta(as, MIPSI_SLL, dest, src, (-shift)&31);
  58. emit_dta(as, MIPSI_SRL, tmp, src, shift);
  59. }
  60. }
  61. #if LJ_64 || LJ_HASBUFFER
  62. static void emit_tsml(ASMState *as, MIPSIns mi, Reg rt, Reg rs, uint32_t msb,
  63. uint32_t lsb)
  64. {
  65. *--as->mcp = mi | MIPSF_T(rt) | MIPSF_S(rs) | MIPSF_M(msb) | MIPSF_L(lsb);
  66. }
  67. #endif
  68. /* -- Emit loads/stores --------------------------------------------------- */
  69. /* Prefer rematerialization of BASE/L from global_State over spills. */
  70. #define emit_canremat(ref) ((ref) <= REF_BASE)
  71. /* Try to find a one step delta relative to another constant. */
  72. static int emit_kdelta1(ASMState *as, Reg rd, intptr_t i)
  73. {
  74. RegSet work = ~as->freeset & RSET_GPR;
  75. while (work) {
  76. Reg r = rset_picktop(work);
  77. IRRef ref = regcost_ref(as->cost[r]);
  78. lj_assertA(r != rd, "dest reg %d not free", rd);
  79. if (ref < ASMREF_L) {
  80. intptr_t delta = (intptr_t)((uintptr_t)i -
  81. (uintptr_t)(ra_iskref(ref) ? ra_krefk(as, ref) : get_kval(as, ref)));
  82. if (checki16(delta)) {
  83. emit_tsi(as, MIPSI_AADDIU, rd, r, delta);
  84. return 1;
  85. }
  86. }
  87. rset_clear(work, r);
  88. }
  89. return 0; /* Failed. */
  90. }
  91. /* Load a 32 bit constant into a GPR. */
  92. static void emit_loadi(ASMState *as, Reg r, int32_t i)
  93. {
  94. if (checki16(i)) {
  95. emit_ti(as, MIPSI_LI, r, i);
  96. } else {
  97. if ((i & 0xffff)) {
  98. intptr_t jgl = (intptr_t)(void *)J2G(as->J);
  99. if ((uintptr_t)(i-jgl) < 65536) {
  100. emit_tsi(as, MIPSI_ADDIU, r, RID_JGL, i-jgl-32768);
  101. return;
  102. } else if (emit_kdelta1(as, r, i)) {
  103. return;
  104. } else if ((i >> 16) == 0) {
  105. emit_tsi(as, MIPSI_ORI, r, RID_ZERO, i);
  106. return;
  107. }
  108. emit_tsi(as, MIPSI_ORI, r, r, i);
  109. }
  110. emit_ti(as, MIPSI_LUI, r, (i >> 16));
  111. }
  112. }
  113. #if LJ_64
  114. /* Load a 64 bit constant into a GPR. */
  115. static void emit_loadu64(ASMState *as, Reg r, uint64_t u64)
  116. {
  117. if (checki32((int64_t)u64)) {
  118. emit_loadi(as, r, (int32_t)u64);
  119. } else {
  120. uint64_t delta = u64 - (uint64_t)(void *)J2G(as->J);
  121. if (delta < 65536) {
  122. emit_tsi(as, MIPSI_DADDIU, r, RID_JGL, (int32_t)(delta-32768));
  123. } else if (emit_kdelta1(as, r, (intptr_t)u64)) {
  124. return;
  125. } else {
  126. /* TODO MIPSR6: Use DAHI & DATI. Caveat: sign-extension. */
  127. if ((u64 & 0xffff)) {
  128. emit_tsi(as, MIPSI_ORI, r, r, u64 & 0xffff);
  129. }
  130. if (((u64 >> 16) & 0xffff)) {
  131. emit_dta(as, MIPSI_DSLL, r, r, 16);
  132. emit_tsi(as, MIPSI_ORI, r, r, (u64 >> 16) & 0xffff);
  133. emit_dta(as, MIPSI_DSLL, r, r, 16);
  134. } else {
  135. emit_dta(as, MIPSI_DSLL32, r, r, 0);
  136. }
  137. emit_loadi(as, r, (int32_t)(u64 >> 32));
  138. }
  139. /* TODO: There are probably more optimization opportunities. */
  140. }
  141. }
  142. #define emit_loada(as, r, addr) emit_loadu64(as, (r), u64ptr((addr)))
  143. #else
  144. #define emit_loada(as, r, addr) emit_loadi(as, (r), i32ptr((addr)))
  145. #endif
  146. static Reg ra_allock(ASMState *as, intptr_t k, RegSet allow);
  147. static void ra_allockreg(ASMState *as, intptr_t k, Reg r);
  148. /* Get/set from constant pointer. */
  149. static void emit_lsptr(ASMState *as, MIPSIns mi, Reg r, void *p, RegSet allow)
  150. {
  151. intptr_t jgl = (intptr_t)(J2G(as->J));
  152. intptr_t i = (intptr_t)(p);
  153. Reg base;
  154. if ((uint32_t)(i-jgl) < 65536) {
  155. i = i-jgl-32768;
  156. base = RID_JGL;
  157. } else {
  158. base = ra_allock(as, i-(int16_t)i, allow);
  159. }
  160. emit_tsi(as, mi, r, base, i);
  161. }
  162. #if LJ_64
  163. static void emit_loadk64(ASMState *as, Reg r, IRIns *ir)
  164. {
  165. const uint64_t *k = &ir_k64(ir)->u64;
  166. Reg r64 = r;
  167. if (rset_test(RSET_FPR, r)) {
  168. r64 = RID_TMP;
  169. emit_tg(as, MIPSI_DMTC1, r64, r);
  170. }
  171. if ((uint32_t)((intptr_t)k-(intptr_t)J2G(as->J)) < 65536)
  172. emit_lsptr(as, MIPSI_LD, r64, (void *)k, 0);
  173. else
  174. emit_loadu64(as, r64, *k);
  175. }
  176. #else
  177. #define emit_loadk64(as, r, ir) \
  178. emit_lsptr(as, MIPSI_LDC1, ((r) & 31), (void *)&ir_knum((ir))->u64, RSET_GPR)
  179. #endif
  180. /* Get/set global_State fields. */
  181. static void emit_lsglptr(ASMState *as, MIPSIns mi, Reg r, int32_t ofs)
  182. {
  183. emit_tsi(as, mi, r, RID_JGL, ofs-32768);
  184. }
  185. #define emit_getgl(as, r, field) \
  186. emit_lsglptr(as, MIPSI_AL, (r), (int32_t)offsetof(global_State, field))
  187. #define emit_setgl(as, r, field) \
  188. emit_lsglptr(as, MIPSI_AS, (r), (int32_t)offsetof(global_State, field))
  189. /* Trace number is determined from per-trace exit stubs. */
  190. #define emit_setvmstate(as, i) UNUSED(i)
  191. /* -- Emit control-flow instructions -------------------------------------- */
  192. /* Label for internal jumps. */
  193. typedef MCode *MCLabel;
  194. /* Return label pointing to current PC. */
  195. #define emit_label(as) ((as)->mcp)
  196. static void emit_branch(ASMState *as, MIPSIns mi, Reg rs, Reg rt, MCode *target)
  197. {
  198. MCode *p = as->mcp;
  199. ptrdiff_t delta = target - p;
  200. lj_assertA(((delta + 0x8000) >> 16) == 0, "branch target out of range");
  201. *--p = mi | MIPSF_S(rs) | MIPSF_T(rt) | ((uint32_t)delta & 0xffffu);
  202. as->mcp = p;
  203. }
  204. static void emit_jmp(ASMState *as, MCode *target)
  205. {
  206. *--as->mcp = MIPSI_NOP;
  207. emit_branch(as, MIPSI_B, RID_ZERO, RID_ZERO, (target));
  208. }
  209. static void emit_call(ASMState *as, void *target, int needcfa)
  210. {
  211. MCode *p = as->mcp;
  212. #if LJ_TARGET_MIPSR6
  213. ptrdiff_t delta = (char *)target - (char *)p;
  214. if ((((delta>>2) + 0x02000000) >> 26) == 0) { /* Try compact call first. */
  215. *--p = MIPSI_BALC | (((uintptr_t)delta >>2) & 0x03ffffffu);
  216. as->mcp = p;
  217. return;
  218. }
  219. #endif
  220. *--p = MIPSI_NOP; /* Delay slot. */
  221. if ((((uintptr_t)target ^ (uintptr_t)p) >> 28) == 0) {
  222. #if !LJ_TARGET_MIPSR6
  223. *--p = (((uintptr_t)target & 1) ? MIPSI_JALX : MIPSI_JAL) |
  224. (((uintptr_t)target >>2) & 0x03ffffffu);
  225. #else
  226. *--p = MIPSI_JAL | (((uintptr_t)target >>2) & 0x03ffffffu);
  227. #endif
  228. } else { /* Target out of range: need indirect call. */
  229. *--p = MIPSI_JALR | MIPSF_S(RID_CFUNCADDR);
  230. needcfa = 1;
  231. }
  232. as->mcp = p;
  233. if (needcfa) ra_allockreg(as, (intptr_t)target, RID_CFUNCADDR);
  234. }
  235. /* -- Emit generic operations --------------------------------------------- */
  236. #define emit_move(as, dst, src) \
  237. emit_ds(as, MIPSI_MOVE, (dst), (src))
  238. /* Generic move between two regs. */
  239. static void emit_movrr(ASMState *as, IRIns *ir, Reg dst, Reg src)
  240. {
  241. if (dst < RID_MAX_GPR)
  242. emit_move(as, dst, src);
  243. else
  244. emit_fg(as, irt_isnum(ir->t) ? MIPSI_MOV_D : MIPSI_MOV_S, dst, src);
  245. }
  246. /* Generic load of register with base and (small) offset address. */
  247. static void emit_loadofs(ASMState *as, IRIns *ir, Reg r, Reg base, int32_t ofs)
  248. {
  249. if (r < RID_MAX_GPR)
  250. emit_tsi(as, irt_is64(ir->t) ? MIPSI_LD : MIPSI_LW, r, base, ofs);
  251. else
  252. emit_tsi(as, irt_isnum(ir->t) ? MIPSI_LDC1 : MIPSI_LWC1,
  253. (r & 31), base, ofs);
  254. }
  255. /* Generic store of register with base and (small) offset address. */
  256. static void emit_storeofs(ASMState *as, IRIns *ir, Reg r, Reg base, int32_t ofs)
  257. {
  258. if (r < RID_MAX_GPR)
  259. emit_tsi(as, irt_is64(ir->t) ? MIPSI_SD : MIPSI_SW, r, base, ofs);
  260. else
  261. emit_tsi(as, irt_isnum(ir->t) ? MIPSI_SDC1 : MIPSI_SWC1,
  262. (r&31), base, ofs);
  263. }
  264. /* Add offset to pointer. */
  265. static void emit_addptr(ASMState *as, Reg r, int32_t ofs)
  266. {
  267. if (ofs) {
  268. lj_assertA(checki16(ofs), "offset %d out of range", ofs);
  269. emit_tsi(as, MIPSI_AADDIU, r, r, ofs);
  270. }
  271. }
  272. #define emit_spsub(as, ofs) emit_addptr(as, RID_SP, -(ofs))