cg386mat.pas 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044
  1. {
  2. $Id$
  3. Copyright (c) 1993-98 by Florian Klaempfl
  4. Generate i386 assembler for math nodes
  5. This program is free software; you can redistribute it and/or modify
  6. it under the terms of the GNU General Public License as published by
  7. the Free Software Foundation; either version 2 of the License, or
  8. (at your option) any later version.
  9. This program is distributed in the hope that it will be useful,
  10. but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. GNU General Public License for more details.
  13. You should have received a copy of the GNU General Public License
  14. along with this program; if not, write to the Free Software
  15. Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
  16. ****************************************************************************
  17. }
  18. unit cg386mat;
  19. interface
  20. uses
  21. tree;
  22. procedure secondmoddiv(var p : ptree);
  23. procedure secondshlshr(var p : ptree);
  24. procedure secondumminus(var p : ptree);
  25. procedure secondnot(var p : ptree);
  26. implementation
  27. uses
  28. globtype,systems,
  29. cobjects,verbose,globals,
  30. symtable,aasm,types,
  31. hcodegen,temp_gen,pass_2,
  32. i386base,i386asm,
  33. {$ifdef dummy}
  34. end { this overcomes the annoying highlighting problem in my TP IDE,
  35. the IDE assumes i386asm start a asm block (FK) }
  36. {$endif}
  37. cgai386,tgeni386;
  38. {*****************************************************************************
  39. SecondModDiv
  40. *****************************************************************************}
  procedure secondmoddiv(var p : ptree);
    { Second pass (code generation) for DIV and MOD nodes.

      p is the div/mod tree node; on exit p^.location describes the
      register(s) that hold the result.

      64 bit operands are handled by calling one of the runtime helpers
      FPC_DIV_QWORD, FPC_MOD_QWORD, FPC_DIV_INT64 or FPC_MOD_INT64.
      32 bit operands are handled inline:
        - DIV by a constant power of two becomes a shift,
        - MOD of an unsigned value by a constant power of two becomes an AND,
        - everything else uses DIV/IDIV with the divisor in EDI. }
    var
      numreg : tregister;            { numerator, later the result register }
      viashift,viamask : boolean;    { which shortcut, if any, was taken }
      saved : boolean;               { left operand was pushed by maybe_push }
      restoreeax,restoreedx : boolean;
      shiftcnt : longint;            { log2 of the constant divisor }
      skiplab : pasmlabel;
      leftcopy : tlocation;
      savedregs : tpushed;
      optext,typetext : string[6];
    begin
      viashift:=false;
      viamask:=false;

      { evaluate both operands, protecting the left result if required }
      secondpass(p^.left);
      set_location(p^.location,p^.left^.location);
      saved:=maybe_push(p^.right^.registers32,p,is_64bitint(p^.left^.resulttype));
      secondpass(p^.right);
      if saved then
        restore(p,is_64bitint(p^.left^.resulttype));

      if is_64bitint(p^.resulttype) then
        begin
          { p^.location is overwritten below, so keep a copy of it;
            that copy is the location of the left operand }
          set_location(leftcopy,p^.location);
          release_qword_loc(p^.location);
          release_qword_loc(p^.right^.location);

          { the result is delivered in the EAX/EDX pair }
          p^.location.registerlow:=getexplicitregister32(R_EAX);
          p^.location.registerhigh:=getexplicitregister32(R_EDX);

          { save every used register except the two result registers }
          pushusedregisters(savedregs,$ff
            and not($80 shr byte(p^.location.registerlow))
            and not($80 shr byte(p^.location.registerhigh)));

          { first helper argument: 1 if overflow checking is on, else 0 }
          push_int(ord(cs_check_overflow in aktlocalswitches));

          { then the left operand (from the saved copy) and the right one }
          emit_pushq_loc(leftcopy);
          clear_location(leftcopy);
          emit_pushq_loc(p^.right^.location);

          { pick the helper: FPC_<DIV_|MOD_><QWORD|INT64> }
          if p^.treetype=divn then
            optext:='DIV_'
          else
            optext:='MOD_';
          if porddef(p^.resulttype)^.typ=u64bit then
            typetext:='QWORD'
          else
            typetext:='INT64';
          emitcall('FPC_'+optext+typetext);

          emit_reg_reg(A_MOV,S_L,R_EAX,p^.location.registerlow);
          emit_reg_reg(A_MOV,S_L,R_EDX,p^.location.registerhigh);
          popusedregisters(savedregs);
          p^.location.loc:=LOC_REGISTER;
        end
      else
        begin
          { make sure the numerator lives in a register we may modify }
          if p^.left^.location.loc=LOC_REGISTER then
            numreg:=p^.left^.location.register
          else
            begin
              if p^.left^.location.loc=LOC_CREGISTER then
                begin
                  numreg:=getregister32;
                  emit_reg_reg(A_MOV,S_L,p^.left^.location.register,numreg);
                end
              else
                begin
                  del_reference(p^.left^.location.reference);
                  numreg:=getregister32;
                  exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
                    newreference(p^.left^.location.reference),numreg)));
                end;
              clear_location(p^.left^.location);
              p^.left^.location.loc:=LOC_REGISTER;
              p^.left^.location.register:=numreg;
            end;

          if (p^.treetype=divn) and (p^.right^.treetype=ordconstn) and
             ispowerof2(p^.right^.value,shiftcnt) then
            begin
              { DIV by a constant power of two: use a shift }
              viashift:=true;
              if is_signed(p^.left^.resulttype) then
                begin
                  { signed: negative numerators get divisor-1 added before
                    the arithmetic shift.  Unsigned values must not be
                    adjusted, otherwise "Cardinal($ffffffff) div 16"
                    overflows (JM) }
                  exprasmlist^.concat(new(pai386,op_reg_reg(A_OR,S_L,numreg,numreg)));
                  getlabel(skiplab);
                  emitjmp(C_NS,skiplab);
                  if shiftcnt=1 then
                    exprasmlist^.concat(new(pai386,op_reg(A_INC,S_L,numreg)))
                  else
                    exprasmlist^.concat(new(pai386,op_const_reg(A_ADD,S_L,
                      p^.right^.value-1,numreg)));
                  emitlab(skiplab);
                  exprasmlist^.concat(new(pai386,op_const_reg(A_SAR,S_L,shiftcnt,numreg)));
                end
              else
                exprasmlist^.concat(new(pai386,op_const_reg(A_SHR,S_L,shiftcnt,numreg)));
            end
          else if (p^.treetype=modn) and (p^.right^.treetype=ordconstn) and
                  ispowerof2(p^.right^.value,shiftcnt) and
                  not(is_signed(p^.left^.resulttype)) then
            begin
              { unsigned MOD by a constant power of two: mask the low bits.
                Is there a similar trick for signed numbers? (JM) }
              exprasmlist^.concat(new(pai386,op_const_reg(A_AND,S_L,
                p^.right^.value-1,numreg)));
              viamask:=true;
            end
          else
            begin
              { general case: the denominator goes to EDI, which is only
                ever used for temporary purposes and hence always free }
              if p^.right^.location.loc in [LOC_REGISTER,LOC_CREGISTER] then
                begin
                  emit_reg_reg(A_MOV,S_L,p^.right^.location.register,R_EDI);
                  ungetregister32(p^.right^.location.register);
                end
              else
                begin
                  del_reference(p^.right^.location.reference);
                  { kept from the original code; the left location is
                    already LOC_REGISTER at this point }
                  p^.left^.location.loc:=LOC_REGISTER;
                  exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
                    newreference(p^.right^.location.reference),R_EDI)));
                end;

              { move the numerator to EAX, saving EAX/EDX on the stack
                when they are in use by something else }
              restoreedx:=false;
              restoreeax:=false;
              if numreg=R_EDX then
                begin
                  if not(R_EAX in unused) then
                    begin
                      exprasmlist^.concat(new(pai386,op_reg(A_PUSH,S_L,R_EAX)));
                      restoreeax:=true;
                    end;
                  emit_reg_reg(A_MOV,S_L,R_EDX,R_EAX);
                end
              else
                begin
                  if not(R_EDX in unused) then
                    begin
                      exprasmlist^.concat(new(pai386,op_reg(A_PUSH,S_L,R_EDX)));
                      restoreedx:=true;
                    end;
                  if numreg<>R_EAX then
                    begin
                      if not(R_EAX in unused) then
                        begin
                          exprasmlist^.concat(new(pai386,op_reg(A_PUSH,S_L,R_EAX)));
                          restoreeax:=true;
                        end;
                      emit_reg_reg(A_MOV,S_L,numreg,R_EAX);
                    end;
                end;

              { how EDX is filled depends on the type of the left operand }
              if porddef(p^.left^.resulttype)^.typ=u32bit then
                exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,R_EDX,R_EDX)))
              else
                exprasmlist^.concat(new(pai386,op_none(A_CDQ,S_NO)));

              { the division opcode depends on the type of the right operand }
              if porddef(p^.right^.resulttype)^.typ=u32bit then
                exprasmlist^.concat(new(pai386,op_reg(A_DIV,S_L,R_EDI)))
              else
                exprasmlist^.concat(new(pai386,op_reg(A_IDIV,S_L,R_EDI)));

              if p^.treetype=divn then
                begin
                  { quotient is in EAX }
                  if restoreeax then
                    begin
                      { EAX was busy and is about to be popped: copy }
                      if numreg=R_EAX then
                        internalerror(112);
                      emit_reg_reg(A_MOV,S_L,R_EAX,numreg)
                    end
                  else if numreg<>R_EAX then
                    begin
                      ungetregister32(numreg);
                      numreg:=getexplicitregister32(R_EAX);
                      { I don't think it's possible that now numreg <> R_EAX
                        since EAX was not pushed, but for all certainty I do
                        support that situation (JM) }
                      if numreg<>R_EAX then
                        emit_reg_reg(A_MOV,S_L,R_EAX,numreg);
                    end;
                end
              else
                begin
                  { if the mod had been done by an "and", the result would be
                    in numreg and EDX certainly would not have been pushed (JM) }
                  if not(viamask) then
                    begin
                      if restoreedx then
                        { the remainder is in EDX, but EDX was occupied
                          before the division, so move the result into a
                          safe place (JM) }
                        emit_reg_reg(A_MOV,S_L,R_EDX,numreg)
                      else
                        begin
                          { get rid of the unnecessary numreg if possible
                            (same as with EAX for div) (JM) }
                          ungetregister32(numreg);
                          numreg:=getexplicitregister32(R_EDX);
                          if numreg<>R_EDX then
                            emit_reg_reg(A_MOV,S_L,R_EDX,numreg);
                        end;
                    end;
                end;

              { restore in reverse order of the pushes above }
              if restoreeax then
                exprasmlist^.concat(new(pai386,op_reg(A_POP,S_L,R_EAX)));
              if restoreedx then
                exprasmlist^.concat(new(pai386,op_reg(A_POP,S_L,R_EDX)));
            end;

          { the shift and mask shortcuts only touch numreg (already recorded
            in usedinproc when it was acquired with getregister); a real
            division also uses both EAX and EDX (JM) }
          if not(viamask) and not(viashift) then
            usedinproc:=usedinproc or ($80 shr byte(R_EAX))
                                   or ($80 shr byte(R_EDX));

          clear_location(p^.location);
          p^.location.loc:=LOC_REGISTER;
          p^.location.register:=numreg;
        end;
    end;
  259. {*****************************************************************************
  260. SecondShlShr
  261. *****************************************************************************}
  procedure secondshlshr(var p : ptree);
    { Second pass (code generation) for SHL and SHR nodes.

      p is the shift tree node; on exit p^.location names the register(s)
      that hold the shifted value.

      64 bit operands are kept in a low/high register pair and shifted
      with SHLD/SHRD (count below 32) or by moving one half into the other
      (count 32 or more).  32 bit operands use a plain SHL/SHR.  A variable
      shift count is always brought into ECX/CL.

      Fix compared to the previous revision: when a 64 bit left operand
      lives in a LOC_CREGISTER, the high dword is now copied into
      hregisterhigh.  It used to be copied into hregisterlow, which
      destroyed the low half and left the high half uninitialised. }
    var
       hregister1,hregister2,hregister3,
       hregisterhigh,hregisterlow : tregister;
       pushed,popecx : boolean;
       op : tasmop;
       hr : preference;
       l1,l2,l3 : pasmlabel;
    begin
       popecx:=false;

       secondpass(p^.left);
       pushed:=maybe_push(p^.right^.registers32,p,is_64bitint(p^.left^.resulttype));
       secondpass(p^.right);
       if pushed then
         restore(p,is_64bitint(p^.left^.resulttype));

       if is_64bitint(p^.left^.resulttype) then
         begin
            { load left operator in a register pair }
            if p^.left^.location.loc<>LOC_REGISTER then
              begin
                 if p^.left^.location.loc=LOC_CREGISTER then
                   begin
                      hregisterlow:=getregister32;
                      hregisterhigh:=getregister32;
                      emit_reg_reg(A_MOV,S_L,p^.left^.location.registerlow,
                        hregisterlow);
                      { the high dword belongs in hregisterhigh }
                      emit_reg_reg(A_MOV,S_L,p^.left^.location.registerhigh,
                        hregisterhigh);
                   end
                 else
                   begin
                      del_reference(p^.left^.location.reference);
                      hregisterlow:=getregister32;
                      hregisterhigh:=getregister32;
                      exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,newreference(p^.left^.location.reference),
                        hregisterlow)));
                      { the high dword is stored 4 bytes after the low one }
                      hr:=newreference(p^.left^.location.reference);
                      inc(hr^.offset,4);
                      exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,hr,
                        hregisterhigh)));
                   end;
              end
            else
              begin
                 hregisterlow:=p^.left^.location.registerlow;
                 hregisterhigh:=p^.left^.location.registerhigh;
              end;

            { shifting by a constant directly coded: }
            if (p^.right^.treetype=ordconstn) then
              begin
                 { shrd/shl works only for values <=31 !! }
                 { NOTE(review): only the low five bits of the count are
                   used here, so constant counts of 64 or more do not give
                   zero as the variable-count code below does - confirm
                   whether that is intended }
                 if p^.right^.value>31 then
                   begin
                      if p^.treetype=shln then
                        begin
                           exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterhigh,
                             hregisterhigh)));
                           exprasmlist^.concat(new(pai386,op_const_reg(A_SHL,S_L,p^.right^.value and 31,
                             hregisterlow)));
                        end
                      else
                        begin
                           exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterlow,
                             hregisterlow)));
                           exprasmlist^.concat(new(pai386,op_const_reg(A_SHR,S_L,p^.right^.value and 31,
                             hregisterhigh)));
                        end;
                      { the two halves trade places: the shifted half
                        becomes the other half of the result and the
                        cleared register takes its place }
                      p^.location.registerhigh:=hregisterlow;
                      p^.location.registerlow:=hregisterhigh;
                   end
                 else
                   begin
                      if p^.treetype=shln then
                        begin
                           exprasmlist^.concat(new(pai386,op_const_reg_reg(A_SHLD,S_L,p^.right^.value and 31,
                             hregisterlow,hregisterhigh)));
                           exprasmlist^.concat(new(pai386,op_const_reg(A_SHL,S_L,p^.right^.value and 31,
                             hregisterlow)));
                        end
                      else
                        begin
                           exprasmlist^.concat(new(pai386,op_const_reg_reg(A_SHRD,S_L,p^.right^.value and 31,
                             hregisterhigh,hregisterlow)));
                           exprasmlist^.concat(new(pai386,op_const_reg(A_SHR,S_L,p^.right^.value and 31,
                             hregisterhigh)));
                        end;
                      p^.location.registerlow:=hregisterlow;
                      p^.location.registerhigh:=hregisterhigh;
                   end;
                 p^.location.loc:=LOC_REGISTER;
              end
            else
              begin
                 { load right operators in a register }
                 if p^.right^.location.loc<>LOC_REGISTER then
                   begin
                      if p^.right^.location.loc=LOC_CREGISTER then
                        begin
                           hregister2:=getexplicitregister32(R_ECX);
                           emit_reg_reg(A_MOV,S_L,p^.right^.location.register,
                             hregister2);
                        end
                      else
                        begin
                           del_reference(p^.right^.location.reference);
                           hregister2:=getexplicitregister32(R_ECX);
                           exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,newreference(p^.right^.location.reference),
                             hregister2)));
                        end;
                   end
                 else
                   hregister2:=p^.right^.location.register;

                 { left operator is already in a register }
                 { hence are both in a register           }
                 { is it in the case ECX ?                }
                 if (hregisterlow=R_ECX) then
                   begin
                      { then only swap }
                      emit_reg_reg(A_XCHG,S_L,hregisterlow,hregister2);
                      hregister3:=hregisterlow;
                      hregisterlow:=hregister2;
                      hregister2:=hregister3;
                   end
                 else if (hregisterhigh=R_ECX) then
                   begin
                      { then only swap }
                      emit_reg_reg(A_XCHG,S_L,hregisterhigh,hregister2);
                      hregister3:=hregisterhigh;
                      hregisterhigh:=hregister2;
                      hregister2:=hregister3;
                   end
                 { if second operator not in ECX ? }
                 else if (hregister2<>R_ECX) then
                   begin
                      { ECX occupied then push it }
                      if not (R_ECX in unused) then
                        begin
                           popecx:=true;
                           exprasmlist^.concat(new(pai386,op_reg(A_PUSH,S_L,R_ECX)));
                        end;
                      emit_reg_reg(A_MOV,S_L,hregister2,R_ECX);
                   end;

                 ungetregister32(hregister2);

                 { the damned shift instructions work only til a count of 32 }
                 { so we've to do some tricks here                           }
                 { generated code, three cases selected at run time:         }
                 {   count >= 64       : result is zero                      }
                 {   32 <= count < 64  : shift one half by count-32, move it }
                 {                       into the other half, clear the first}
                 {   count < 32        : SHLD/SHRD followed by SHL/SHR       }
                 if p^.treetype=shln then
                   begin
                      getlabel(l1);
                      getlabel(l2);
                      getlabel(l3);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_CMP,S_L,64,R_ECX)));
                      emitjmp(C_L,l1);
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterlow,hregisterlow)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterhigh,hregisterhigh)));
                      emitjmp(C_None,l3);
                      emitlab(l1);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_CMP,S_L,32,R_ECX)));
                      emitjmp(C_L,l2);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_SUB,S_L,32,R_ECX)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_SHL,S_L,R_CL,
                        hregisterlow)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_MOV,S_L,hregisterlow,hregisterhigh)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterlow,hregisterlow)));
                      emitjmp(C_None,l3);
                      emitlab(l2);
                      exprasmlist^.concat(new(pai386,op_reg_reg_reg(A_SHLD,S_L,R_CL,
                        hregisterlow,hregisterhigh)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_SHL,S_L,R_CL,
                        hregisterlow)));
                      emitlab(l3);
                   end
                 else
                   begin
                      getlabel(l1);
                      getlabel(l2);
                      getlabel(l3);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_CMP,S_L,64,R_ECX)));
                      emitjmp(C_L,l1);
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterlow,hregisterlow)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterhigh,hregisterhigh)));
                      emitjmp(C_None,l3);
                      emitlab(l1);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_CMP,S_L,32,R_ECX)));
                      emitjmp(C_L,l2);
                      exprasmlist^.concat(new(pai386,op_const_reg(A_SUB,S_L,32,R_ECX)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_SHR,S_L,R_CL,
                        hregisterhigh)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_MOV,S_L,hregisterhigh,hregisterlow)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregisterhigh,hregisterhigh)));
                      emitjmp(C_None,l3);
                      emitlab(l2);
                      exprasmlist^.concat(new(pai386,op_reg_reg_reg(A_SHRD,S_L,R_CL,
                        hregisterhigh,hregisterlow)));
                      exprasmlist^.concat(new(pai386,op_reg_reg(A_SHR,S_L,R_CL,
                        hregisterhigh)));
                      emitlab(l3);
                   end;

                 { maybe put ECX back }
                 if popecx then
                   exprasmlist^.concat(new(pai386,op_reg(A_POP,S_L,R_ECX)));

                 p^.location.registerlow:=hregisterlow;
                 p^.location.registerhigh:=hregisterhigh;
              end;
         end
       else
         begin
            { load left operators in a register }
            if p^.left^.location.loc<>LOC_REGISTER then
              begin
                 if p^.left^.location.loc=LOC_CREGISTER then
                   begin
                      hregister1:=getregister32;
                      emit_reg_reg(A_MOV,S_L,p^.left^.location.register,
                        hregister1);
                   end
                 else
                   begin
                      del_reference(p^.left^.location.reference);
                      hregister1:=getregister32;
                      exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,newreference(p^.left^.location.reference),
                        hregister1)));
                   end;
              end
            else
              hregister1:=p^.left^.location.register;

            { determine operator }
            if p^.treetype=shln then
              op:=A_SHL
            else
              op:=A_SHR;

            { shifting by a constant directly coded: }
            if (p^.right^.treetype=ordconstn) then
              begin
                 { l shl 32 should 0 imho, but neither TP nor Delphi do it in this way (FK)
                 if p^.right^.value<=31 then
                 }
                   exprasmlist^.concat(new(pai386,op_const_reg(op,S_L,p^.right^.value and 31,
                     hregister1)));
                 {
                 else
                   exprasmlist^.concat(new(pai386,op_reg_reg(A_XOR,S_L,hregister1,
                     hregister1)));
                 }
                 p^.location.loc:=LOC_REGISTER;
                 p^.location.register:=hregister1;
              end
            else
              begin
                 { load right operators in a register }
                 if p^.right^.location.loc<>LOC_REGISTER then
                   begin
                      if p^.right^.location.loc=LOC_CREGISTER then
                        begin
                           hregister2:=getexplicitregister32(R_ECX);
                           emit_reg_reg(A_MOV,S_L,p^.right^.location.register,
                             hregister2);
                        end
                      else
                        begin
                           del_reference(p^.right^.location.reference);
                           hregister2:=getexplicitregister32(R_ECX);
                           exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,newreference(p^.right^.location.reference),
                             hregister2)));
                        end;
                   end
                 else
                   hregister2:=p^.right^.location.register;

                 { left operator is already in a register }
                 { hence are both in a register           }
                 { is it in the case ECX ?                }
                 if (hregister1=R_ECX) then
                   begin
                      { then only swap }
                      emit_reg_reg(A_XCHG,S_L,hregister1,hregister2);
                      hregister3:=hregister1;
                      hregister1:=hregister2;
                      hregister2:=hregister3;
                   end
                 { if second operator not in ECX ? }
                 else if (hregister2<>R_ECX) then
                   begin
                      { ECX occupied then push it }
                      if not (R_ECX in unused) then
                        begin
                           popecx:=true;
                           exprasmlist^.concat(new(pai386,op_reg(A_PUSH,S_L,R_ECX)));
                        end;
                      emit_reg_reg(A_MOV,S_L,hregister2,R_ECX);
                   end;
                 ungetregister32(hregister2);

                 { right operand is in ECX }
                 emit_reg_reg(op,S_L,R_CL,hregister1);

                 { maybe ECX back }
                 if popecx then
                   exprasmlist^.concat(new(pai386,op_reg(A_POP,S_L,R_ECX)));
                 p^.location.register:=hregister1;
              end;
         end;
    end;
  561. {*****************************************************************************
  562. SecondUmMinus
  563. *****************************************************************************}
  procedure secondumminus(var p : ptree);
    { Second pass (code generation) for the unary minus node.

      p is the unary minus tree node; on exit p^.location describes where
      the negated value is held:
        - 64 bit integers : register pair, negated with NEG/ADC/NEG
        - 32 bit integers : register, negated with NEG
        - floats          : FPU stack, sign flipped with FCHS
        - MMX arrays      : MMX register (only when SUPPORT_MMX is defined)

      Fix compared to the previous revision: for a 32 bit operand in a
      LOC_CREGISTER the value is now copied from p^.left^.location.register
      into the freshly allocated result register.  The old code moved the
      result register onto itself, so NEG ran on an uninitialised
      register. }

{$ifdef SUPPORT_MMX}
    procedure do_mmx_neg;
      { Negates the MMX value in p^.location.register by subtracting it
        from MM7 and copying MM7 back.  Every caller in this procedure
        clears MM7 with PXOR first. }
      var
         op : tasmop;
      begin
         p^.location.loc:=LOC_MMXREGISTER;
         { NOTE(review): neither case statement has an else branch, so op
           keeps an undefined value for element types not listed - confirm
           those types cannot reach this point }
         if cs_mmx_saturation in aktlocalswitches then
           case mmx_type(p^.resulttype) of
              mmxs8bit:
                op:=A_PSUBSB;
              mmxu8bit:
                op:=A_PSUBUSB;
              mmxs16bit,mmxfixed16:
                op:=A_PSUBSW;
              mmxu16bit:
                op:=A_PSUBUSW;
           end
         else
           case mmx_type(p^.resulttype) of
              mmxs8bit,mmxu8bit:
                op:=A_PSUBB;
              mmxs16bit,mmxu16bit,mmxfixed16:
                op:=A_PSUBW;
              mmxs32bit,mmxu32bit:
                op:=A_PSUBD;
           end;
         emit_reg_reg(op,S_NO,p^.location.register,R_MM7);
         emit_reg_reg(A_MOVQ,S_NO,R_MM7,p^.location.register);
      end;
{$endif}

    var
       hr : preference;
    begin
       if is_64bitint(p^.left^.resulttype) then
         begin
            secondpass(p^.left);
            clear_location(p^.location);
            p^.location.loc:=LOC_REGISTER;
            { get the operand into a register pair we are allowed to modify }
            case p^.left^.location.loc of
              LOC_REGISTER :
                begin
                   p^.location.registerlow:=p^.left^.location.registerlow;
                   p^.location.registerhigh:=p^.left^.location.registerhigh;
                end;
              LOC_CREGISTER :
                begin
                   p^.location.registerlow:=getregister32;
                   p^.location.registerhigh:=getregister32;
                   emit_reg_reg(A_MOV,S_L,p^.left^.location.registerlow,p^.location.registerlow);
                   emit_reg_reg(A_MOV,S_L,p^.left^.location.registerhigh,p^.location.registerhigh);
                end;
              LOC_REFERENCE,LOC_MEM :
                begin
                   del_reference(p^.left^.location.reference);
                   p^.location.registerlow:=getregister32;
                   p^.location.registerhigh:=getregister32;
                   exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
                     newreference(p^.left^.location.reference),p^.location.registerlow)));
                   { the high dword is stored 4 bytes after the low one }
                   hr:=newreference(p^.left^.location.reference);
                   inc(hr^.offset,4);
                   exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
                     hr,p^.location.registerhigh)));
                end;
            end;
            { 64 bit negate: NEG of the low dword sets the carry flag when
              that dword is non-zero; the carry is added to the high dword,
              which is then negated as well }
            exprasmlist^.concat(new(pai386,op_reg(A_NEG,S_L,p^.location.registerlow)));
            exprasmlist^.concat(new(pai386,op_const_reg(A_ADC,S_L,0,p^.location.registerhigh)));
            exprasmlist^.concat(new(pai386,op_reg(A_NEG,S_L,p^.location.registerhigh)));
         end
       else
         begin
            secondpass(p^.left);
            p^.location.loc:=LOC_REGISTER;
            case p^.left^.location.loc of
               LOC_REGISTER:
                 begin
                    { negate in place }
                    p^.location.register:=p^.left^.location.register;
                    exprasmlist^.concat(new(pai386,op_reg(A_NEG,S_L,p^.location.register)));
                 end;
               LOC_CREGISTER:
                 begin
                    { copy the operand out of its register first, then
                      negate the copy }
                    p^.location.register:=getregister32;
                    emit_reg_reg(A_MOV,S_L,p^.left^.location.register,
                      p^.location.register);
                    exprasmlist^.concat(new(pai386,op_reg(A_NEG,S_L,p^.location.register)));
                 end;
{$ifdef SUPPORT_MMX}
               LOC_MMXREGISTER:
                 begin
                    set_location(p^.location,p^.left^.location);
                    emit_reg_reg(A_PXOR,S_NO,R_MM7,R_MM7);
                    do_mmx_neg;
                 end;
               LOC_CMMXREGISTER:
                 begin
                    p^.location.register:=getregistermmx;
                    emit_reg_reg(A_PXOR,S_NO,R_MM7,R_MM7);
                    emit_reg_reg(A_MOVQ,S_NO,p^.left^.location.register,
                      p^.location.register);
                    do_mmx_neg;
                 end;
{$endif SUPPORT_MMX}
               LOC_REFERENCE,LOC_MEM:
                 begin
                    del_reference(p^.left^.location.reference);
                    if (p^.left^.resulttype^.deftype=floatdef) and
                       (pfloatdef(p^.left^.resulttype)^.typ<>f32bit) then
                      begin
                         { float (other than f32bit): load onto the FPU
                           stack and change the sign there }
                         p^.location.loc:=LOC_FPU;
                         floatload(pfloatdef(p^.left^.resulttype)^.typ,
                           p^.left^.location.reference);
                         exprasmlist^.concat(new(pai386,op_none(A_FCHS,S_NO)));
                      end
{$ifdef SUPPORT_MMX}
                    else if (cs_mmx in aktlocalswitches) and is_mmx_able_array(p^.left^.resulttype) then
                      begin
                         p^.location.register:=getregistermmx;
                         emit_reg_reg(A_PXOR,S_NO,R_MM7,R_MM7);
                         exprasmlist^.concat(new(pai386,op_ref_reg(A_MOVQ,S_NO,
                           newreference(p^.left^.location.reference),
                           p^.location.register)));
                         do_mmx_neg;
                      end
{$endif SUPPORT_MMX}
                    else
                      begin
                         p^.location.register:=getregister32;
                         exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
                           newreference(p^.left^.location.reference),
                           p^.location.register)));
                         exprasmlist^.concat(new(pai386,op_reg(A_NEG,S_L,p^.location.register)));
                      end;
                 end;
               LOC_FPU:
                 begin
                    { operand is already on the FPU stack }
                    p^.location.loc:=LOC_FPU;
                    exprasmlist^.concat(new(pai386,op_none(A_FCHS,S_NO)));
                 end;
            end;
         end;
       { Here was a problem...            }
       { Operand to be negated always     }
       { seems to be converted to signed  }
       { 32-bit before doing neg!!        }
       { So this is useless...            }
       { emitoverflowcheck(p); }
    end;
  711. {*****************************************************************************
  712. SecondNot
  713. *****************************************************************************}
  714. procedure secondnot(var p : ptree);
  715. const
  716. flagsinvers : array[F_E..F_BE] of tresflags =
  717. (F_NE,F_E,F_LE,F_GE,F_L,F_G,F_NC,F_C,
  718. F_A,F_AE,F_B,F_BE);
  719. var
  720. hl : pasmlabel;
  721. opsize : topsize;
  722. hr : preference;
  723. begin
  724. if is_boolean(p^.resulttype) then
  725. begin
  726. opsize:=def_opsize(p^.resulttype);
  727. case p^.left^.location.loc of
  728. LOC_JUMP :
  729. begin
  730. hl:=truelabel;
  731. truelabel:=falselabel;
  732. falselabel:=hl;
  733. secondpass(p^.left);
  734. maketojumpbool(p^.left);
  735. hl:=truelabel;
  736. truelabel:=falselabel;
  737. falselabel:=hl;
  738. end;
  739. LOC_FLAGS :
  740. begin
  741. secondpass(p^.left);
  742. p^.location.resflags:=flagsinvers[p^.left^.location.resflags];
  743. end;
  744. LOC_REGISTER :
  745. begin
  746. secondpass(p^.left);
  747. {p^.location.register:=p^.left^.location.register;
  748. exprasmlist^.concat(new(pai386,op_const_reg(A_XOR,opsize,1,p^.location.register)));}
  749. p^.location.loc:=LOC_FLAGS;
  750. p^.location.resflags:=F_E;
  751. exprasmlist^.concat(new(pai386,op_reg_reg(A_TEST,opsize,
  752. p^.left^.location.register,p^.left^.location.register)));
  753. ungetregister(p^.left^.location.register);
  754. end;
  755. LOC_CREGISTER :
  756. begin
  757. secondpass(p^.left);
  758. clear_location(p^.location);
  759. p^.location.loc:=LOC_REGISTER;
  760. p^.location.register:=def_getreg(p^.resulttype);
  761. emit_reg_reg(A_MOV,opsize,p^.left^.location.register,p^.location.register);
  762. exprasmlist^.concat(new(pai386,op_reg_reg(A_TEST,opsize,p^.location.register,p^.location.register)));
  763. ungetregister(p^.location.register);
  764. p^.location.loc:=LOC_FLAGS;
  765. p^.location.resflags:=F_E;
  766. end;
  767. LOC_REFERENCE,
  768. LOC_MEM :
  769. begin
  770. secondpass(p^.left);
  771. clear_location(p^.location);
  772. p^.location.loc:=LOC_REGISTER;
  773. del_reference(p^.left^.location.reference);
  774. { this was placed before del_ref => internaalerror(10) }
  775. p^.location.register:=def_getreg(p^.resulttype);
  776. exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,opsize,
  777. newreference(p^.left^.location.reference),p^.location.register)));
  778. exprasmlist^.concat(new(pai386,op_reg_reg(A_TEST,opsize,p^.location.register,p^.location.register)));
  779. ungetregister(p^.location.register);
  780. p^.location.loc:=LOC_FLAGS;
  781. p^.location.resflags:=F_E;
  782. end;
  783. end;
  784. end
  785. {$ifdef SUPPORT_MMX}
  786. else
  787. if (cs_mmx in aktlocalswitches) and is_mmx_able_array(p^.left^.resulttype) then
  788. begin
  789. secondpass(p^.left);
  790. p^.location.loc:=LOC_MMXREGISTER;
  791. { prepare EDI }
  792. exprasmlist^.concat(new(pai386,op_const_reg(A_MOV,S_L,$ffffffff,R_EDI)));
  793. { load operand }
  794. case p^.left^.location.loc of
  795. LOC_MMXREGISTER:
  796. set_location(p^.location,p^.left^.location);
  797. LOC_CMMXREGISTER:
  798. begin
  799. p^.location.register:=getregistermmx;
  800. emit_reg_reg(A_MOVQ,S_NO,p^.left^.location.register,p^.location.register);
  801. end;
  802. LOC_REFERENCE,LOC_MEM:
  803. begin
  804. del_reference(p^.left^.location.reference);
  805. p^.location.register:=getregistermmx;
  806. exprasmlist^.concat(new(pai386,op_ref_reg(A_MOVQ,S_NO,
  807. newreference(p^.left^.location.reference),p^.location.register)));
  808. end;
  809. end;
  810. { load mask }
  811. emit_reg_reg(A_MOV,S_D,R_EDI,R_MM7);
  812. { lower 32 bit }
  813. emit_reg_reg(A_PXOR,S_D,R_MM7,p^.location.register);
  814. { shift mask }
  815. exprasmlist^.concat(new(pai386,op_const_reg(A_PSLLQ,S_NO,32,R_MM7)));
  816. { higher 32 bit }
  817. emit_reg_reg(A_PXOR,S_D,R_MM7,p^.location.register);
  818. end
  819. {$endif SUPPORT_MMX}
  820. else if is_64bitint(p^.left^.resulttype) then
  821. begin
  822. secondpass(p^.left);
  823. clear_location(p^.location);
  824. p^.location.loc:=LOC_REGISTER;
  825. case p^.left^.location.loc of
  826. LOC_REGISTER :
  827. begin
  828. p^.location.registerlow:=p^.left^.location.registerlow;
  829. p^.location.registerhigh:=p^.left^.location.registerhigh;
  830. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerlow)));
  831. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerhigh)));
  832. end;
  833. LOC_CREGISTER :
  834. begin
  835. p^.location.registerlow:=getregister32;
  836. p^.location.registerhigh:=getregister32;
  837. emit_reg_reg(A_MOV,S_L,p^.left^.location.registerlow,p^.location.registerlow);
  838. emit_reg_reg(A_MOV,S_L,p^.left^.location.registerhigh,p^.location.registerhigh);
  839. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerlow)));
  840. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerhigh)));
  841. end;
  842. LOC_REFERENCE,LOC_MEM :
  843. begin
  844. del_reference(p^.left^.location.reference);
  845. p^.location.registerlow:=getregister32;
  846. p^.location.registerhigh:=getregister32;
  847. exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
  848. newreference(p^.left^.location.reference),p^.location.registerlow)));
  849. hr:=newreference(p^.left^.location.reference);
  850. inc(hr^.offset,4);
  851. exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
  852. hr,p^.location.registerhigh)));
  853. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerlow)));
  854. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.registerhigh)));
  855. end;
  856. end;
  857. end
  858. else
  859. begin
  860. secondpass(p^.left);
  861. clear_location(p^.location);
  862. p^.location.loc:=LOC_REGISTER;
  863. case p^.left^.location.loc of
  864. LOC_REGISTER :
  865. begin
  866. p^.location.register:=p^.left^.location.register;
  867. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.register)));
  868. end;
  869. LOC_CREGISTER :
  870. begin
  871. p^.location.register:=getregister32;
  872. emit_reg_reg(A_MOV,S_L,p^.left^.location.register,p^.location.register);
  873. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.register)));
  874. end;
  875. LOC_REFERENCE,LOC_MEM :
  876. begin
  877. del_reference(p^.left^.location.reference);
  878. p^.location.register:=getregister32;
  879. exprasmlist^.concat(new(pai386,op_ref_reg(A_MOV,S_L,
  880. newreference(p^.left^.location.reference),p^.location.register)));
  881. exprasmlist^.concat(new(pai386,op_reg(A_NOT,S_L,p^.location.register)));
  882. end;
  883. end;
  884. end;
  885. end;
  886. end.
  887. {
  888. $Log$
  889. Revision 1.26 1999-06-02 10:11:44 florian
  890. * make cycle fixed i.e. compilation with 0.99.10
  891. * some fixes for qword
  892. * start of register calling conventions
  893. Revision 1.25 1999/05/27 19:44:16 peter
  894. * removed oldasm
  895. * plabel -> pasmlabel
  896. * -a switches to source writing automatically
  897. * assembler readers OOPed
  898. * asmsymbol automatically external
  899. * jumptables and other label fixes for asm readers
  900. Revision 1.24 1999/05/25 20:36:13 florian
  901. * some bugs in the qword code generation fixed
  902. Revision 1.23 1999/05/08 20:41:08 jonas
  903. + positive number MOD power of 2 now done with AND instruction
  904. * fix to division of positive numbers by power of 2
  905. * the result of a MOD is left in EDX if possible
  906. Revision 1.22 1999/05/01 13:24:11 peter
  907. * merged nasm compiler
  908. * old asm moved to oldasm/
  909. Revision 1.21 1999/04/16 13:42:27 jonas
  910. * more regalloc fixes (still not complete)
  911. Revision 1.20 1999/02/22 02:15:13 peter
  912. * updates for ag386bin
  913. Revision 1.19 1999/02/04 10:49:40 florian
  914. + range checking for ansi- and widestrings
  915. * made it compilable with TP
  916. Revision 1.18 1999/02/03 10:11:12 pierre
  917. * fix for bug0211 for i386
  918. Revision 1.17 1999/01/21 22:10:41 peter
  919. * fixed array of const
  920. * generic platform independent high() support
  921. Revision 1.16 1999/01/19 10:51:32 pierre
  922. * fix to bug0183 in secondnot
  923. Revision 1.15 1998/12/11 16:50:22 florian
  924. + typed const int64 and qword
  925. + unary minus-operator q1:=-q2;
  926. + not-operator
  927. Revision 1.14 1998/12/11 16:10:07 florian
  928. + shifting for 64 bit ints added
  929. * bug in getexplicitregister32 fixed: usableregs wasn't decremented !!
  930. Revision 1.13 1998/12/11 00:02:52 peter
  931. + globtype,tokens,version unit split from globals
  932. Revision 1.12 1998/11/26 21:45:29 jonas
  933. - removed A_CLTD opcode (use A_CDQ instead)
  934. * changed cbw, cwde and cwd to cbtw, cwtl and cwtd in att_op2str array
  935. * in daopt386: adapted AsmInstr array to reflect changes + fixed line too long
  936. Revision 1.11 1998/11/05 14:26:02 peter
  937. * fixed shlshr which would push ecx when not needed
  938. Revision 1.10 1998/10/20 13:12:38 peter
  939. * fixed 'not not boolean', the location was not set to register
  940. Revision 1.9 1998/10/20 08:06:42 pierre
  941. * several memory corruptions due to double freemem solved
  942. => never use p^.loc.location:=p^.left^.loc.location;
  943. + finally, ra386dir now by default
  944. translates global and unit symbols
  945. + added a first field in tsymtable and
  946. a nextsym field in tsym
  947. (this allows to obtain ordered type info for
  948. records and objects in gdb !)
  949. Revision 1.8 1998/10/09 08:56:24 pierre
  950. * several memory leaks fixed
  951. Revision 1.7 1998/09/17 09:42:17 peter
  952. + pass_2 for cg386
  953. * Message() -> CGMessage() for pass_1/pass_2
  954. Revision 1.6 1998/09/09 14:37:37 florian
  955. * mod/div for cardinal type fixed
  956. Revision 1.5 1998/08/23 16:07:20 florian
  957. * internalerror with mod/div fixed
  958. Revision 1.4 1998/08/18 09:24:38 pierre
  959. * small warning position bug fixed
  960. * support_mmx switches splitting was missing
  961. * rhide error and warning output corrected
  962. Revision 1.3 1998/06/05 17:44:12 peter
  963. * split cgi386
  964. Revision 1.2 1998/06/02 17:02:59 pierre
  965. * with node corrected for objects
  966. * small bugs for SUPPORT_MMX fixed
  967. Revision 1.1 1998/06/01 16:50:18 peter
  968. + boolean -> ord conversion
  969. * fixed ord -> boolean conversion
  970. }