ngppcadd.pas 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555
  1. {
  2. Copyright (c) 2000-2006 by Florian Klaempfl and Jonas Maebe
  3. Code generation for add nodes on the PowerPC (32 and 64 bit generic)
  4. This program is free software; you can redistribute it and/or modify
  5. it under the terms of the GNU General Public License as published by
  6. the Free Software Foundation; either version 2 of the License, or
  7. (at your option) any later version.
  8. This program is distributed in the hope that it will be useful,
  9. but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  11. GNU General Public License for more details.
  12. You should have received a copy of the GNU General Public License
  13. along with this program; if not, write to the Free Software
  14. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  15. ****************************************************************************
  16. }
  17. unit ngppcadd;
  18. {$i fpcdefs.inc}
  19. interface
  20. uses
  21. node,nadd,ncgadd,cpubase;
  22. type
  23. tgenppcaddnode = class(tcgaddnode)
  24. function pass_1: tnode; override;
  25. protected
  26. procedure pass_left_and_right;
  27. procedure load_left_right(cmpop, load_constants: boolean);
  28. function getresflags : tresflags;
  29. procedure emit_compare(unsigned: boolean); virtual; abstract;
  30. procedure second_addfloat;override;
  31. procedure second_addboolean;override;
  32. procedure second_addsmallset;override;
  33. end;
  34. implementation
  {*****************************************************************************
                        Units used by the implementation
  *****************************************************************************}
  38. uses
  39. globtype,systems,
  40. cutils,verbose,globals,
  41. symconst,symdef,paramgr,
  42. aasmbase,aasmtai,aasmdata,aasmcpu,defutil,htypechk,
  43. cgbase,cpuinfo,pass_1,pass_2,regvars,
  44. cpupara,cgcpu,cgutils,procinfo,
  45. ncon,nset,
  46. ncgutil,tgobj,rgobj,rgcpu,cgobj,hlcgobj;
  47. {*****************************************************************************
  48. Pass 1
  49. *****************************************************************************}
  50. function tgenppcaddnode.pass_1: tnode;
  51. begin
  52. typecheckpass(left);
  53. if (nodetype in [equaln,unequaln]) and
  54. (left.resultdef.typ = orddef) and
  55. is_64bit(left.resultdef) then
  56. begin
  57. result := nil;
  58. firstpass(left);
  59. firstpass(right);
  60. expectloc := LOC_FLAGS;
  61. exit;
  62. end;
  63. result := inherited pass_1;
  64. end;
  65. {*****************************************************************************
  66. Helpers
  67. *****************************************************************************}
  68. procedure tgenppcaddnode.pass_left_and_right;
  69. begin
  70. { calculate the operator which is more difficult }
  71. firstcomplex(self);
  72. { in case of constant put it to the left }
  73. if (left.nodetype=ordconstn) then
  74. swapleftright;
  75. secondpass(left);
  76. secondpass(right);
  77. end;
  78. procedure tgenppcaddnode.load_left_right(cmpop, load_constants: boolean);
  79. procedure load_node(var n: tnode);
  80. begin
  81. case n.location.loc of
  82. LOC_REGISTER,
  83. LOC_CREGISTER:
  84. ;
  85. LOC_CONSTANT:
  86. begin
  87. if load_constants then
  88. hlcg.location_force_reg(current_asmdata.CurrAsmList,n.location,n.resultdef,n.resultdef,false);
  89. end;
  90. else
  91. hlcg.location_force_reg(current_asmdata.CurrAsmList,n.location,n.resultdef,n.resultdef,false);
  92. end;
  93. end;
  94. begin
  95. load_node(left);
  96. load_node(right);
  97. if not(cmpop) then
  98. begin
  99. location.register := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  100. {$ifndef cpu64bitalu}
  101. if is_64bit(resultdef) then
  102. location.register64.reghi := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  103. {$endif not cpu64bitalu}
  104. end;
  105. end;
  106. function tgenppcaddnode.getresflags : tresflags;
  107. begin
  108. if (left.resultdef.typ <> floatdef) then
  109. begin
  110. result.cr := RS_CR0;
  111. case nodetype of
  112. equaln : result.flag:=F_EQ;
  113. unequaln : result.flag:=F_NE;
  114. else
  115. if nf_swapped in flags then
  116. case nodetype of
  117. ltn : result.flag:=F_GT;
  118. lten : result.flag:=F_GE;
  119. gtn : result.flag:=F_LT;
  120. gten : result.flag:=F_LE;
  121. end
  122. else
  123. case nodetype of
  124. ltn : result.flag:=F_LT;
  125. lten : result.flag:=F_LE;
  126. gtn : result.flag:=F_GT;
  127. gten : result.flag:=F_GE;
  128. end;
  129. end
  130. end
  131. else
  132. begin
  133. result.cr := RS_CR1;
  134. if (nodetype=equaln) then
  135. result.flag:=F_EQ
  136. else if (nodetype=unequaln) then
  137. result.flag:=F_NE
  138. else if (nf_swapped in flags) then
  139. case nodetype of
  140. ltn : result.flag:=F_FA;
  141. lten : result.flag:=F_FAE;
  142. gtn : result.flag:=F_FB;
  143. gten : result.flag:=F_FBE;
  144. else
  145. internalerror(2014031902);
  146. end
  147. else
  148. case nodetype of
  149. ltn : result.flag:=F_FB;
  150. lten : result.flag:=F_FBE;
  151. gtn : result.flag:=F_FA;
  152. gten : result.flag:=F_FAE;
  153. else
  154. internalerror(2014031903);
  155. end;
  156. end;
  157. end;
  158. {*****************************************************************************
  159. AddBoolean
  160. *****************************************************************************}
  161. procedure tgenppcaddnode.second_addboolean;
  162. var
  163. cgop : TOpCg;
  164. cgsize : TCgSize;
  165. cmpop : boolean;
  166. begin
  167. { calculate the operator which is more difficult }
  168. firstcomplex(self);
  169. cmpop:=false;
  170. if (torddef(left.resultdef).ordtype in [pasbool8,bool8bit]) or
  171. (torddef(right.resultdef).ordtype in [pasbool8,bool8bit]) then
  172. cgsize:=OS_8
  173. else if (torddef(left.resultdef).ordtype in [pasbool16,bool16bit]) or
  174. (torddef(right.resultdef).ordtype in [pasbool16,bool16bit]) then
  175. cgsize:=OS_16
  176. else if (torddef(left.resultdef).ordtype in [pasbool32,bool32bit]) or
  177. (torddef(right.resultdef).ordtype in [pasbool32,bool32bit]) then
  178. cgsize:=OS_32
  179. else
  180. cgsize:=OS_64;
  181. if {$ifndef cpu64bitalu}(cgsize<>OS_64) and{$endif}
  182. (((cs_full_boolean_eval in current_settings.localswitches) and
  183. not(nf_short_bool in flags)) or
  184. (nodetype in [unequaln,ltn,lten,gtn,gten,equaln,xorn])) then
  185. begin
  186. if left.nodetype in [ordconstn,realconstn] then
  187. swapleftright;
  188. secondpass(left);
  189. if (left.expectloc=LOC_JUMP)<>
  190. (left.location.loc=LOC_JUMP) then
  191. internalerror(2003122901);
  192. if left.location.loc in [LOC_FLAGS,LOC_JUMP] then
  193. hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,cgsize_orddef(cgsize),false);
  194. secondpass(right);
  195. if (right.expectloc=LOC_JUMP)<>
  196. (right.location.loc=LOC_JUMP) then
  197. internalerror(200312292);
  198. if right.location.loc in [LOC_FLAGS,LOC_JUMP] then
  199. hlcg.location_force_reg(current_asmdata.CurrAsmList,right.location,right.resultdef,cgsize_orddef(cgsize),false);
  200. cmpop := nodetype in [ltn,lten,gtn,gten,equaln,unequaln];
  201. { set result location }
  202. if not cmpop then
  203. location_reset(location,LOC_REGISTER,def_cgsize(resultdef))
  204. else
  205. location_reset(location,LOC_FLAGS,OS_NO);
  206. load_left_right(cmpop,false);
  207. if (left.location.loc = LOC_CONSTANT) then
  208. swapleftright;
  209. { compare the }
  210. case nodetype of
  211. ltn,lten,gtn,gten,
  212. equaln,unequaln :
  213. begin
  214. if (right.location.loc <> LOC_CONSTANT) then
  215. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg(A_CMPLW,
  216. left.location.register,right.location.register))
  217. else
  218. current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_CMPLWI,
  219. left.location.register,longint(right.location.value)));
  220. location.resflags := getresflags;
  221. end;
  222. else
  223. begin
  224. case nodetype of
  225. xorn :
  226. cgop:=OP_XOR;
  227. orn :
  228. cgop:=OP_OR;
  229. andn :
  230. cgop:=OP_AND;
  231. else
  232. internalerror(200203247);
  233. end;
  234. if right.location.loc <> LOC_CONSTANT then
  235. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList,cgop,OS_INT,
  236. left.location.register,right.location.register,
  237. location.register)
  238. else
  239. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList,cgop,OS_INT,
  240. right.location.value,left.location.register,
  241. location.register);
  242. end;
  243. end;
  244. end
  245. else
  246. inherited second_addboolean;
  247. end;
  248. {*****************************************************************************
  249. AddFloat
  250. *****************************************************************************}
  251. procedure tgenppcaddnode.second_addfloat;
  252. var
  253. op : TAsmOp;
  254. cmpop,
  255. singleprec : boolean;
  256. begin
  257. pass_left_and_right;
  258. cmpop:=false;
  259. singleprec:=tfloatdef(left.resultdef).floattype=s32real;
  260. case nodetype of
  261. addn :
  262. if singleprec then
  263. op:=A_FADDS
  264. else
  265. op:=A_FADD;
  266. muln :
  267. if singleprec then
  268. op:=A_FMULS
  269. else
  270. op:=A_FMUL;
  271. subn :
  272. if singleprec then
  273. op:=A_FSUBS
  274. else
  275. op:=A_FSUB;
  276. slashn :
  277. if singleprec then
  278. op:=A_FDIVS
  279. else
  280. op:=A_FDIV;
  281. ltn,lten,gtn,gten,
  282. equaln,unequaln :
  283. begin
  284. op:=A_FCMPO;
  285. cmpop:=true;
  286. end;
  287. else
  288. internalerror(200403182);
  289. end;
  290. // get the operands in the correct order, there are no special cases
  291. // here, everything is register-based
  292. if nf_swapped in flags then
  293. swapleftright;
  294. // put both operands in a register
  295. hlcg.location_force_fpureg(current_asmdata.CurrAsmList,right.location,right.resultdef,true);
  296. hlcg.location_force_fpureg(current_asmdata.CurrAsmList,left.location,left.resultdef,true);
  297. // initialize de result
  298. if not cmpop then
  299. begin
  300. location_reset(location,LOC_FPUREGISTER,def_cgsize(resultdef));
  301. location.register := cg.getfpuregister(current_asmdata.CurrAsmList,location.size);
  302. end
  303. else
  304. begin
  305. location_reset(location,LOC_FLAGS,OS_NO);
  306. location.resflags := getresflags;
  307. end;
  308. // emit the actual operation
  309. if not cmpop then
  310. begin
  311. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(op,
  312. location.register,left.location.register,
  313. right.location.register))
  314. end
  315. else
  316. begin
  317. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(op,
  318. newreg(R_SPECIALREGISTER,location.resflags.cr,R_SUBNONE),left.location.register,right.location.register))
  319. end;
  320. end;
  321. {*****************************************************************************
  322. AddSmallSet
  323. *****************************************************************************}
  324. procedure tgenppcaddnode.second_addsmallset;
  325. var
  326. cgop : TOpCg;
  327. setbase: aint;
  328. tmpreg : tregister;
  329. opdone,
  330. cmpop : boolean;
  331. begin
  332. if target_info.endian=endian_little then
  333. begin
  334. { this code currently assumes big endian }
  335. if (left.nodetype=setelementn) or (right.nodetype=setelementn) then
  336. begin
  337. inherited second_addsmallsetelement;
  338. exit;
  339. end
  340. end;
  341. cgop:=OP_None;
  342. pass_left_and_right;
  343. { when a setdef is passed, it has to be a smallset }
  344. if (not(nf_swapped in flags) and
  345. not is_smallset(left.resultdef) or
  346. (not is_smallset(right.resultdef) and
  347. (right.nodetype<>setelementn))) or
  348. ((nf_swapped in flags) and
  349. not is_smallset(right.resultdef) or
  350. (not is_smallset(left.resultdef) and
  351. (left.nodetype<>setelementn))) then
  352. internalerror(200203359);
  353. opdone := false;
  354. cmpop:=nodetype in [equaln,unequaln,lten,gten];
  355. { set result location }
  356. if not cmpop then
  357. location_reset(location,LOC_REGISTER,def_cgsize(resultdef))
  358. else
  359. location_reset(location,LOC_FLAGS,OS_NO);
  360. load_left_right(cmpop,false);
  361. if not(cmpop) then
  362. location.register := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  363. if (left.resultdef.typ=setdef) then
  364. setbase:=tsetdef(left.resultdef).setbase
  365. else
  366. setbase:=tsetdef(right.resultdef).setbase;
  367. if (nf_swapped in flags) and
  368. ((nodetype=subn) or
  369. (left.nodetype=setelementn)) then
  370. swapleftright;
  371. { we don't support two constant locations (should ideally be handled
  372. in simplify }
  373. if (left.location.loc=LOC_CONSTANT) and
  374. (right.location.loc=LOC_CONSTANT) then
  375. hlcg.location_force_reg(current_asmdata.CurrAsmList,left.location,left.resultdef,left.resultdef,true);
  376. case nodetype of
  377. addn :
  378. begin
  379. { are we adding set elements ? }
  380. if right.nodetype=setelementn then
  381. begin
  382. { no range support for smallsets! }
  383. if assigned(tsetelementnode(right).right) then
  384. internalerror(43244);
  385. if (right.location.loc = LOC_CONSTANT) then
  386. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList,OP_OR,OS_INT,
  387. aint((aword(1) shl (resultdef.size*8-1)) shr aword(right.location.value-setbase)),
  388. left.location.register,location.register)
  389. else
  390. begin
  391. tmpreg := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  392. cg.a_load_const_reg(current_asmdata.CurrAsmList,OS_INT,aint((aword(1) shl (resultdef.size*8-1))),tmpreg);
  393. register_maybe_adjust_setbase(current_asmdata.CurrAsmList,right.location,setbase);
  394. cg.a_op_reg_reg(current_asmdata.CurrAsmList,OP_SHR,OS_INT,
  395. right.location.register,tmpreg);
  396. if left.location.loc <> LOC_CONSTANT then
  397. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList,OP_OR,OS_INT,tmpreg,
  398. left.location.register,location.register)
  399. else
  400. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList,OP_OR,OS_INT,
  401. left.location.value,tmpreg,location.register);
  402. end;
  403. opdone := true;
  404. end
  405. else
  406. cgop := OP_OR;
  407. end;
  408. symdifn :
  409. cgop:=OP_XOR;
  410. muln :
  411. cgop:=OP_AND;
  412. subn :
  413. begin
  414. cgop:=OP_AND;
  415. if (right.location.loc=LOC_CONSTANT) then
  416. right.location.value := not(right.location.value)
  417. else
  418. opdone := true;
  419. if opdone then
  420. begin
  421. if left.location.loc = LOC_CONSTANT then
  422. begin
  423. tmpreg := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  424. cg.a_load_const_reg(current_asmdata.CurrAsmList,OS_INT,
  425. left.location.value,tmpreg);
  426. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_ANDC,
  427. location.register,tmpreg,right.location.register));
  428. end
  429. else
  430. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_ANDC,
  431. location.register,left.location.register,
  432. right.location.register));
  433. end;
  434. end;
  435. equaln,
  436. unequaln :
  437. begin
  438. emit_compare(true);
  439. opdone := true;
  440. end;
  441. lten,gten:
  442. begin
  443. If (not(nf_swapped in flags) and
  444. (nodetype = lten)) or
  445. ((nf_swapped in flags) and
  446. (nodetype = gten)) then
  447. swapleftright;
  448. // now we have to check whether left >= right
  449. tmpreg := cg.getintregister(current_asmdata.CurrAsmList,OS_INT);
  450. if left.location.loc = LOC_CONSTANT then
  451. begin
  452. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList,OP_AND,OS_INT,
  453. not(left.location.value),right.location.register,tmpreg);
  454. current_asmdata.CurrAsmList.concat(taicpu.op_reg_const(A_CMPWI,tmpreg,0));
  455. // the two instructions above should be folded together by
  456. // the peepholeoptimizer
  457. end
  458. else
  459. begin
  460. if right.location.loc = LOC_CONSTANT then
  461. begin
  462. cg.a_load_const_reg(current_asmdata.CurrAsmList,OS_INT,
  463. right.location.value,tmpreg);
  464. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_ANDC_,tmpreg,
  465. tmpreg,left.location.register));
  466. end
  467. else
  468. current_asmdata.CurrAsmList.concat(taicpu.op_reg_reg_reg(A_ANDC_,tmpreg,
  469. right.location.register,left.location.register));
  470. end;
  471. location.resflags.cr := RS_CR0;
  472. location.resflags.flag := F_EQ;
  473. opdone := true;
  474. end;
  475. else
  476. internalerror(2002072701);
  477. end;
  478. if not opdone then
  479. begin
  480. // these are all commutative operations
  481. if (left.location.loc = LOC_CONSTANT) then
  482. swapleftright;
  483. if (right.location.loc = LOC_CONSTANT) then
  484. cg.a_op_const_reg_reg(current_asmdata.CurrAsmList,cgop,OS_INT,
  485. right.location.value,left.location.register,
  486. location.register)
  487. else
  488. cg.a_op_reg_reg_reg(current_asmdata.CurrAsmList,cgop,OS_INT,
  489. right.location.register,left.location.register,
  490. location.register);
  491. end;
  492. end;
  493. end.