ncpumat.pas 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297
  1. {
  2. David Zhang 2007/01/15
  3. $Id: ncpumat.pas,v 1.23 2005/02/14 17:13:10 peter Exp $
  4. Copyright (c) 1998-2002 by Florian Klaempfl
  5. Generate MIPSel assembler for math nodes
  6. This program is free software; you can redistribute it and/or modify
  7. it under the terms of the GNU General Public License as published by
  8. the Free Software Foundation; either version 2 of the License, or
  9. (at your option) any later version.
  10. This program is distributed in the hope that it will be useful,
  11. but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. GNU General Public License for more details.
  14. You should have received a copy of the GNU General Public License
  15. along with this program; if not, write to the Free Software
  16. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  17. ****************************************************************************
  18. }
  19. unit ncpumat;
  20. {$i fpcdefs.inc}
  21. interface
  22. uses
  23. node, nmat, ncgmat, cgbase;
  24. type
  25. tMIPSELmoddivnode = class(tmoddivnode)
  26. procedure pass_generate_code;override;
  27. end;
  28. tMIPSELshlshrnode = class(tcgshlshrnode)
  29. procedure second_64bit;override;
  30. { everything will be handled in pass_2 }
  31. function first_shlshr64bitint: tnode; override;
  32. end;
  33. tMIPSELnotnode = class(tcgnotnode)
  34. procedure second_boolean; override;
  35. end;
  36. TMIPSunaryminusnode = class(tcgunaryminusnode)
  37. procedure second_float; override;
  38. end;
  39. implementation
  40. uses
  41. globtype, systems,
  42. cutils, verbose, globals,
  43. symconst, symdef,
  44. aasmbase, aasmcpu, aasmtai, aasmdata,
  45. defutil,
  46. procinfo,
  47. cgobj, hlcgobj, pass_2,
  48. ncon,
  49. cpubase,
  50. ncgutil, cgcpu, cgutils;
  51. {*****************************************************************************
  52. TMipselMODDIVNODE
  53. *****************************************************************************}
  54. const
  55. ops_div: array[boolean] of tasmop = (A_DIVU, A_DIV);
  56. procedure tMIPSELmoddivnode.pass_generate_code;
  57. var
  58. power: longint;
  59. tmpreg, numerator, divider: tregister;
  60. hl,hl2: tasmlabel;
  61. begin
  62. secondpass(left);
  63. secondpass(right);
  64. location_reset(location,LOC_REGISTER,def_cgsize(resultdef));
  65. location.register:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT);
  66. { put numerator in register }
  67. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True);
  68. numerator := left.location.Register;
  69. if (nodetype = divn) and
  70. (right.nodetype = ordconstn) then
  71. begin
  72. if ispowerof2(tordconstnode(right).Value.svalue, power) then
  73. begin
  74. tmpreg := cg.GetIntRegister(current_asmdata.CurrAsmList, OS_INT);
  75. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, 31, numerator, tmpreg);
  76. { if signed, tmpreg=right value-1, otherwise 0 }
  77. cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_AND, OS_INT, tordconstnode(right).Value.svalue - 1, tmpreg);
  78. { add left value }
  79. cg.a_op_reg_reg(current_asmdata.CurrAsmList, OP_ADD, OS_INT, numerator, tmpreg);
  80. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, aword(power), tmpreg, location.register);
  81. end
  82. else
  83. cg.g_div_const_reg_reg(current_asmdata.CurrAsmList,def_cgsize(resultdef),
  84. tordconstnode(right).value.svalue,numerator,location.register);
  85. end
  86. else
  87. begin
  88. { load divider in a register if necessary }
  89. hlcg.location_force_reg(current_asmdata.CurrAsmList, right.location,
  90. right.resultdef, right.resultdef, True);
  91. divider := right.location.Register;
  92. { GAS performs division in delay slot:
  93. bne denom,$zero,.L1
  94. div $zero,numerator,denom
  95. break 7
  96. .L1:
  97. mflo result
  98. We can't yet do the same without prior fixing the spilling code:
  99. if registers require spilling, loads can be inserted before 'div',
  100. resulting in invalid code.
  101. }
  102. current_asmdata.CurrAsmList.Concat(taicpu.op_reg_reg_reg(ops_div[is_signed(resultdef)],NR_R0,numerator,divider));
  103. { Check for zero denominator, omit if dividing by constant (constants are checked earlier) }
  104. if (right.nodetype<>ordconstn) then
  105. begin
  106. current_asmdata.getjumplabel(hl);
  107. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R0,hl);
  108. current_asmdata.CurrAsmList.Concat(taicpu.op_const(A_BREAK,7));
  109. cg.a_label(current_asmdata.CurrAsmList,hl);
  110. end;
  111. { Dividing low(longint) by -1 will overflow }
  112. if is_signed(right.resultdef) and (cs_check_overflow in current_settings.localswitches) then
  113. begin
  114. current_asmdata.getjumplabel(hl2);
  115. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_const(A_ADDIU,NR_R1,NR_R0,-1));
  116. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R1,hl2);
  117. current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_LUI,NR_R1,$8000));
  118. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,numerator,NR_R1,hl2);
  119. current_asmdata.CurrAsmList.concat(taicpu.op_const(A_BREAK,6));
  120. cg.a_label(current_asmdata.CurrAsmList,hl2);
  121. end;
  122. if (nodetype=modn) then
  123. current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFHI,location.register))
  124. else
  125. current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFLO,location.register));
  126. end;
  127. end;
  128. {*****************************************************************************
  129. TMIPSelSHLRSHRNODE
  130. *****************************************************************************}
  131. function TMIPSELShlShrNode.first_shlshr64bitint: TNode;
  132. begin
  133. { 64bit without constants need a helper }
  134. if is_64bit(left.resultdef) and
  135. (right.nodetype <> ordconstn) then
  136. begin
  137. Result := inherited first_shlshr64bitint;
  138. exit;
  139. end;
  140. Result := nil;
  141. end;
  142. procedure tMIPSELshlshrnode.second_64bit;
  143. var
  144. hregister, hreg64hi, hreg64lo: tregister;
  145. op: topcg;
  146. shiftval: aword;
  147. const
  148. ops: array [boolean] of topcg = (OP_SHR,OP_SHL);
  149. begin
  150. { 64bit without constants need a helper, and is
  151. already replaced in pass1 }
  152. if (right.nodetype <> ordconstn) then
  153. internalerror(200405301);
  154. location_reset(location, LOC_REGISTER, def_cgsize(resultdef));
  155. { load left operator in a register }
  156. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, resultdef, true);
  157. hreg64hi := left.location.register64.reghi;
  158. hreg64lo := left.location.register64.reglo;
  159. shiftval := tordconstnode(right).Value.svalue and 63;
  160. op := ops[nodetype=shln];
  161. if shiftval > 31 then
  162. begin
  163. if nodetype = shln then
  164. begin
  165. location.register64.reglo:=NR_R0;
  166. location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  167. { if shiftval and 31 = 0, it will optimize to MOVE }
  168. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, shiftval and 31, hreg64lo, location.register64.reghi);
  169. end
  170. else
  171. begin
  172. location.register64.reghi:=NR_R0;
  173. location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  174. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, shiftval and 31, hreg64hi, location.register64.reglo);
  175. end;
  176. end
  177. else
  178. begin
  179. location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  180. location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  181. hregister := cg.getintregister(current_asmdata.CurrAsmList, OS_32);
  182. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64hi, location.register64.reghi);
  183. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64lo, location.register64.reglo);
  184. if shiftval <> 0 then
  185. begin
  186. if nodetype = shln then
  187. begin
  188. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, 32-shiftval, hreg64lo, hregister);
  189. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reghi, location.register64.reghi);
  190. end
  191. else
  192. begin
  193. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, 32-shiftval, hreg64hi, hregister);
  194. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reglo, location.register64.reglo);
  195. end;
  196. end;
  197. end;
  198. end;
  199. {*****************************************************************************
  200. TMIPSelNOTNODE
  201. *****************************************************************************}
  202. procedure tMIPSELnotnode.second_boolean;
  203. var
  204. tmpreg : TRegister;
  205. begin
  206. if not handle_locjump then
  207. begin
  208. secondpass(left);
  209. case left.location.loc of
  210. LOC_REGISTER, LOC_CREGISTER, LOC_REFERENCE, LOC_CREFERENCE,
  211. LOC_SUBSETREG,LOC_CSUBSETREG,LOC_SUBSETREF,LOC_CSUBSETREF:
  212. begin
  213. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True);
  214. location_reset(location,LOC_FLAGS,OS_NO);
  215. location.resflags.reg2:=NR_R0;
  216. location.resflags.cond:=OC_EQ;
  217. if is_64bit(resultdef) then
  218. begin
  219. tmpreg:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT);
  220. { OR low and high parts together }
  221. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_OR,tmpreg,left.location.register64.reglo,left.location.register64.reghi));
  222. location.resflags.reg1:=tmpreg;
  223. end
  224. else
  225. location.resflags.reg1:=left.location.register;
  226. end;
  227. else
  228. internalerror(2003042401);
  229. end;
  230. end;
  231. end;
  232. {*****************************************************************************
  233. TMIPSunaryminusnode
  234. *****************************************************************************}
  235. procedure TMIPSunaryminusnode.second_float;
  236. begin
  237. secondpass(left);
  238. hlcg.location_force_fpureg(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
  239. location_reset(location,LOC_FPUREGISTER,def_cgsize(resultdef));
  240. location.register:=cg.getfpuregister(current_asmdata.CurrAsmList,location.size);
  241. case location.size of
  242. OS_F32:
  243. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_s,location.register,left.location.register));
  244. OS_F64:
  245. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_d,location.register,left.location.register));
  246. else
  247. internalerror(2013030501);
  248. end;
  249. end;
  250. begin
  251. cmoddivnode := tMIPSELmoddivnode;
  252. cshlshrnode := tMIPSELshlshrnode;
  253. cnotnode := tMIPSELnotnode;
  254. cunaryminusnode := TMIPSunaryminusnode;
  255. end.