ncpumat.pas 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298
  1. {
  2. David Zhang 2007/01/15
  3. $Id: ncpumat.pas,v 1.23 2005/02/14 17:13:10 peter Exp $
  4. Copyright (c) 1998-2002 by Florian Klaempfl
  5. Generate MIPSel assembler for math nodes
  6. This program is free software; you can redistribute it and/or modify
  7. it under the terms of the GNU General Public License as published by
  8. the Free Software Foundation; either version 2 of the License, or
  9. (at your option) any later version.
  10. This program is distributed in the hope that it will be useful,
  11. but WITHOUT ANY WARRANTY; without even the implied warranty of
  12. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  13. GNU General Public License for more details.
  14. You should have received a copy of the GNU General Public License
  15. along with this program; if not, write to the Free Software
  16. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  17. ****************************************************************************
  18. }
  19. unit ncpumat;
  20. {$i fpcdefs.inc}
  21. interface
  22. uses
  23. symtype,
  24. node, nmat, ncgmat, cgbase;
  25. type
  26. tMIPSELmoddivnode = class(tmoddivnode)
  27. procedure pass_generate_code;override;
  28. end;
  29. tMIPSELshlshrnode = class(tcgshlshrnode)
  30. procedure second_64bit;override;
  31. { everything will be handled in pass_2 }
  32. function first_shlshr64bitint: tnode; override;
  33. end;
  34. tMIPSELnotnode = class(tcgnotnode)
  35. procedure second_boolean; override;
  36. end;
  37. TMIPSunaryminusnode = class(tcgunaryminusnode)
  38. procedure second_float; override;
  39. end;
  40. implementation
  41. uses
  42. globtype, systems,
  43. cutils, verbose, globals,
  44. symconst, symdef,
  45. aasmbase, aasmcpu, aasmtai, aasmdata,
  46. defutil,
  47. procinfo,
  48. cgobj, hlcgobj, pass_2,
  49. ncon,
  50. cpubase,
  51. ncgutil, cgcpu, cgutils;
  52. {*****************************************************************************
  53. TMipselMODDIVNODE
  54. *****************************************************************************}
  55. const
  56. ops_div: array[boolean] of tasmop = (A_DIVU, A_DIV);
  57. procedure tMIPSELmoddivnode.pass_generate_code;
  58. var
  59. power: longint;
  60. tmpreg, numerator, divider: tregister;
  61. hl,hl2: tasmlabel;
  62. begin
  63. secondpass(left);
  64. secondpass(right);
  65. location_reset(location,LOC_REGISTER,def_cgsize(resultdef));
  66. location.register:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT);
  67. { put numerator in register }
  68. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True);
  69. numerator := left.location.Register;
  70. if (nodetype = divn) and
  71. (right.nodetype = ordconstn) then
  72. begin
  73. if ispowerof2(tordconstnode(right).Value.svalue, power) then
  74. begin
  75. tmpreg := cg.GetIntRegister(current_asmdata.CurrAsmList, OS_INT);
  76. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, 31, numerator, tmpreg);
  77. { if signed, tmpreg=right value-1, otherwise 0 }
  78. cg.a_op_const_reg(current_asmdata.CurrAsmList, OP_AND, OS_INT, tordconstnode(right).Value.svalue - 1, tmpreg);
  79. { add left value }
  80. cg.a_op_reg_reg(current_asmdata.CurrAsmList, OP_ADD, OS_INT, numerator, tmpreg);
  81. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SAR, OS_INT, aword(power), tmpreg, location.register);
  82. end
  83. else
  84. cg.g_div_const_reg_reg(current_asmdata.CurrAsmList,def_cgsize(resultdef),
  85. tordconstnode(right).value.svalue,numerator,location.register);
  86. end
  87. else
  88. begin
  89. { load divider in a register if necessary }
  90. hlcg.location_force_reg(current_asmdata.CurrAsmList, right.location,
  91. right.resultdef, right.resultdef, True);
  92. divider := right.location.Register;
  93. { GAS performs division in delay slot:
  94. bne denom,$zero,.L1
  95. div $zero,numerator,denom
  96. break 7
  97. .L1:
  98. mflo result
  99. We can't yet do the same without prior fixing the spilling code:
  100. if registers require spilling, loads can be inserted before 'div',
  101. resulting in invalid code.
  102. }
  103. current_asmdata.CurrAsmList.Concat(taicpu.op_reg_reg_reg(ops_div[is_signed(resultdef)],NR_R0,numerator,divider));
  104. { Check for zero denominator, omit if dividing by constant (constants are checked earlier) }
  105. if (right.nodetype<>ordconstn) then
  106. begin
  107. current_asmdata.getjumplabel(hl);
  108. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R0,hl);
  109. current_asmdata.CurrAsmList.Concat(taicpu.op_const(A_BREAK,7));
  110. cg.a_label(current_asmdata.CurrAsmList,hl);
  111. end;
  112. { Dividing low(longint) by -1 will overflow }
  113. if is_signed(right.resultdef) and (cs_check_overflow in current_settings.localswitches) then
  114. begin
  115. current_asmdata.getjumplabel(hl2);
  116. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_const(A_ADDIU,NR_R1,NR_R0,-1));
  117. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,divider,NR_R1,hl2);
  118. current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_LUI,NR_R1,$8000));
  119. cg.a_cmp_reg_reg_label(current_asmdata.CurrAsmList,OS_INT,OC_NE,numerator,NR_R1,hl2);
  120. current_asmdata.CurrAsmList.concat(taicpu.op_const(A_BREAK,6));
  121. cg.a_label(current_asmdata.CurrAsmList,hl2);
  122. end;
  123. if (nodetype=modn) then
  124. current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFHI,location.register))
  125. else
  126. current_asmdata.CurrAsmList.concat(taicpu.op_reg(A_MFLO,location.register));
  127. end;
  128. end;
  129. {*****************************************************************************
  130. TMIPSelSHLRSHRNODE
  131. *****************************************************************************}
  132. function TMIPSELShlShrNode.first_shlshr64bitint: TNode;
  133. begin
  134. { 64bit without constants need a helper }
  135. if is_64bit(left.resultdef) and
  136. (right.nodetype <> ordconstn) then
  137. begin
  138. Result := inherited first_shlshr64bitint;
  139. exit;
  140. end;
  141. Result := nil;
  142. end;
  143. procedure tMIPSELshlshrnode.second_64bit;
  144. var
  145. hregister, hreg64hi, hreg64lo: tregister;
  146. op: topcg;
  147. shiftval: aword;
  148. const
  149. ops: array [boolean] of topcg = (OP_SHR,OP_SHL);
  150. begin
  151. { 64bit without constants need a helper, and is
  152. already replaced in pass1 }
  153. if (right.nodetype <> ordconstn) then
  154. internalerror(200405301);
  155. location_reset(location, LOC_REGISTER, def_cgsize(resultdef));
  156. { load left operator in a register }
  157. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, resultdef, true);
  158. hreg64hi := left.location.register64.reghi;
  159. hreg64lo := left.location.register64.reglo;
  160. shiftval := tordconstnode(right).Value.svalue and 63;
  161. op := ops[nodetype=shln];
  162. if shiftval > 31 then
  163. begin
  164. if nodetype = shln then
  165. begin
  166. location.register64.reglo:=NR_R0;
  167. location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  168. { if shiftval and 31 = 0, it will optimize to MOVE }
  169. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, shiftval and 31, hreg64lo, location.register64.reghi);
  170. end
  171. else
  172. begin
  173. location.register64.reghi:=NR_R0;
  174. location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  175. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, shiftval and 31, hreg64hi, location.register64.reglo);
  176. end;
  177. end
  178. else
  179. begin
  180. location.register64.reglo:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  181. location.register64.reghi:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_32);
  182. hregister := cg.getintregister(current_asmdata.CurrAsmList, OS_32);
  183. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64hi, location.register64.reghi);
  184. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, op, OS_32, shiftval, hreg64lo, location.register64.reglo);
  185. if shiftval <> 0 then
  186. begin
  187. if nodetype = shln then
  188. begin
  189. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHR, OS_32, 32-shiftval, hreg64lo, hregister);
  190. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reghi, location.register64.reghi);
  191. end
  192. else
  193. begin
  194. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList, OP_SHL, OS_32, 32-shiftval, hreg64hi, hregister);
  195. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList, OP_OR, OS_32, hregister, location.register64.reglo, location.register64.reglo);
  196. end;
  197. end;
  198. end;
  199. end;
  200. {*****************************************************************************
  201. TMIPSelNOTNODE
  202. *****************************************************************************}
  203. procedure tMIPSELnotnode.second_boolean;
  204. var
  205. tmpreg : TRegister;
  206. begin
  207. if not handle_locjump then
  208. begin
  209. secondpass(left);
  210. case left.location.loc of
  211. LOC_REGISTER, LOC_CREGISTER, LOC_REFERENCE, LOC_CREFERENCE,
  212. LOC_SUBSETREG,LOC_CSUBSETREG,LOC_SUBSETREF,LOC_CSUBSETREF:
  213. begin
  214. hlcg.location_force_reg(current_asmdata.CurrAsmList, left.location, left.resultdef, left.resultdef, True);
  215. location_reset(location,LOC_FLAGS,OS_NO);
  216. location.resflags.reg2:=NR_R0;
  217. location.resflags.cond:=OC_EQ;
  218. if is_64bit(resultdef) then
  219. begin
  220. tmpreg:=cg.GetIntRegister(current_asmdata.CurrAsmList,OS_INT);
  221. { OR low and high parts together }
  222. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_OR,tmpreg,left.location.register64.reglo,left.location.register64.reghi));
  223. location.resflags.reg1:=tmpreg;
  224. end
  225. else
  226. location.resflags.reg1:=left.location.register;
  227. end;
  228. else
  229. internalerror(2003042401);
  230. end;
  231. end;
  232. end;
  233. {*****************************************************************************
  234. TMIPSunaryminusnode
  235. *****************************************************************************}
  236. procedure TMIPSunaryminusnode.second_float;
  237. begin
  238. secondpass(left);
  239. hlcg.location_force_fpureg(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
  240. location_reset(location,LOC_FPUREGISTER,def_cgsize(resultdef));
  241. location.register:=cg.getfpuregister(current_asmdata.CurrAsmList,location.size);
  242. case location.size of
  243. OS_F32:
  244. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_s,location.register,left.location.register));
  245. OS_F64:
  246. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_NEG_d,location.register,left.location.register));
  247. else
  248. internalerror(2013030501);
  249. end;
  250. end;
  251. begin
  252. cmoddivnode := tMIPSELmoddivnode;
  253. cshlshrnode := tMIPSELshlshrnode;
  254. cnotnode := tMIPSELnotnode;
  255. cunaryminusnode := TMIPSunaryminusnode;
  256. end.